From c56648907e044bfde716efe803a1b4e78bf52eff Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Fri, 23 Aug 2024 13:07:20 +0200 Subject: [PATCH 01/15] draft data dictionary --- data-raw/data_dictionary.R | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) create mode 100644 data-raw/data_dictionary.R diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R new file mode 100644 index 00000000..0280ca7e --- /dev/null +++ b/data-raw/data_dictionary.R @@ -0,0 +1,19 @@ +# Data dictionary for the output table company_technology_deviation_tms +dd_company_technology_deviation_tms <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "company_technology_deviation_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "company_technology_deviation_tms", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "company_technology_deviation_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_technology_deviation_tms", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "company_technology_deviation_tms", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "company_technology_deviation_tms", "name_abcd", "character", "The name of the company", "The name of the company", + "company_technology_deviation_tms", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_technology_deviation_tms", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_technology_deviation_tms", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", + "company_technology_deviation_tms", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", + "company_technology_deviation_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" +) + +data_dictionary <- dplyr::bind_rows(dd_company_technology_deviation_tms) + +usethis::use_data(data_dictionary, overwrite = TRUE) From 6219fddfacb2481cb470f4dab1000a3faeab08ea Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 26 Aug 2024 11:30:57 +0200 Subject: [PATCH 02/15] add placeholders data_dictionary --- data-raw/data_dictionary.R | 60 +++++++++++++++++++++++++++++++++++++- 1 file changed, 59 insertions(+), 1 deletion(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index 0280ca7e..d21667fe 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -14,6 +14,64 @@ dd_company_technology_deviation_tms <- dplyr::tribble( "company_technology_deviation_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" ) -data_dictionary <- dplyr::bind_rows(dd_company_technology_deviation_tms) +# TODO +dd_company_alignment_net_tms <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "company_alignment_net_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "company_alignment_net_tms", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "company_alignment_net_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_net_tms", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "company_alignment_net_tms", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "company_alignment_net_tms", "name_abcd", "character", "The name of the company", "The name of the company", + "company_alignment_net_tms", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_alignment_net_tms", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_alignment_net_tms", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", + "company_alignment_net_tms", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", + "company_alignment_net_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" +) + +# TODO +dd_company_alignment_bo_po_tms <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "company_alignment_bo_po_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "company_alignment_bo_po_tms", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "company_alignment_bo_po_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_bo_po_tms", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "company_alignment_bo_po_tms", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "company_alignment_bo_po_tms", "name_abcd", "character", "The name of the company", "The name of the company", + "company_alignment_bo_po_tms", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_alignment_bo_po_tms", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_alignment_bo_po_tms", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", + "company_alignment_bo_po_tms", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", + "company_alignment_bo_po_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" +) + +# TODO +dd_company_alignment_net_sda <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "company_alignment_net_sda", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "company_alignment_net_sda", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "company_alignment_net_sda", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_net_sda", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "company_alignment_net_sda", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "company_alignment_net_sda", "name_abcd", "character", "The name of the company", "The name of the company", + "company_alignment_net_sda", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_alignment_net_sda", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", + "company_alignment_net_sda", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", + "company_alignment_net_sda", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", + "company_alignment_net_sda", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" +) + +# TODO: company_exposure_bo_po_aggregate_alignment<_by_...> +# TODO: company_exposure_net_aggregate_alignment<_by_...> +# TODO: loanbook_exposure_bo_po_aggregate_alignment<_by_...> +# TODO: loanbook_exposure_net_aggregate_alignment<_by_...> + +data_dictionary <- dplyr::bind_rows( + dd_company_technology_deviation_tms, + dd_company_alignment_net_tms, + dd_company_alignment_bo_po_tms, + dd_company_alignment_net_sda +) usethis::use_data(data_dictionary, overwrite = TRUE) From 6fb97d2851821e995667ebc83919d8aaa17d2684 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 26 Aug 2024 12:21:46 +0200 Subject: [PATCH 03/15] add explanations --- data-raw/data_dictionary.R | 34 +++++++++++++++------------------- 1 file changed, 15 insertions(+), 19 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index d21667fe..ea0dfafb 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -10,40 +10,36 @@ dd_company_technology_deviation_tms <- dplyr::tribble( "company_technology_deviation_tms", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", "company_technology_deviation_tms", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", "company_technology_deviation_tms", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", - "company_technology_deviation_tms", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", + "company_technology_deviation_tms", "direction", "character", "The direction the technology follows long term in the scenario", "One of the following: 'buildout', 'phaseout'", "company_technology_deviation_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" ) -# TODO dd_company_alignment_net_tms <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, + "company_alignment_net_tms", "name_abcd", "character", "The name of the company", "The name of the company", "company_alignment_net_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", - "company_alignment_net_tms", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", - "company_alignment_net_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_net_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", "company_alignment_net_tms", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", "company_alignment_net_tms", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", - "company_alignment_net_tms", "name_abcd", "character", "The name of the company", "The name of the company", - "company_alignment_net_tms", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", - "company_alignment_net_tms", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", - "company_alignment_net_tms", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", - "company_alignment_net_tms", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", - "company_alignment_net_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" + "company_alignment_net_tms", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "company_alignment_net_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_net_tms", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'net'", + "company_alignment_net_tms", "total_deviation", "double", "Net aggregate deviation of all underlying technologies, accounting for directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "company_alignment_net_tms", "alignment_metric", "double", "Net aggregate alignment value by sector. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" ) -# TODO dd_company_alignment_bo_po_tms <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, + "company_alignment_bo_po_tms", "name_abcd", "character", "The name of the company", "The name of the company", "company_alignment_bo_po_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", - "company_alignment_bo_po_tms", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", - "company_alignment_bo_po_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_bo_po_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", "company_alignment_bo_po_tms", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", "company_alignment_bo_po_tms", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", - "company_alignment_bo_po_tms", "name_abcd", "character", "The name of the company", "The name of the company", - "company_alignment_bo_po_tms", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", - "company_alignment_bo_po_tms", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", - "company_alignment_bo_po_tms", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", - "company_alignment_bo_po_tms", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", - "company_alignment_bo_po_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" + "company_alignment_bo_po_tms", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "company_alignment_bo_po_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_bo_po_tms", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", + "company_alignment_bo_po_tms", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "company_alignment_bo_po_tms", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" ) # TODO From 75bbc3a6fd3e56dabd7e0dd2b97e745b3e6da3e3 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 26 Aug 2024 12:30:59 +0200 Subject: [PATCH 04/15] more explanations --- data-raw/data_dictionary.R | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index ea0dfafb..bc237191 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -45,17 +45,16 @@ dd_company_alignment_bo_po_tms <- dplyr::tribble( # TODO dd_company_alignment_net_sda <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "company_alignment_net_sda", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", - "company_alignment_net_sda", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", - "company_alignment_net_sda", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_net_sda", "name_abcd", "character", "The name of the company", "The name of the company", + "company_alignment_net_sda", "sector", "character", "The sector of the technology", "One of the following: 'aviation', 'cement', 'steel'", + "company_alignment_net_sda", "activity_unit", "character", "The unit the physical emission intensity is measured in for a given sector", "The unit corresponding to the sector. For example 'tCO2 / t cement'", "company_alignment_net_sda", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", "company_alignment_net_sda", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", - "company_alignment_net_sda", "name_abcd", "character", "The name of the company", "The name of the company", - "company_alignment_net_sda", "projected", "double", "The projected activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", - "company_alignment_net_sda", "target_", "double", "The target activity level of the technology in the year for the given company", "Numerical value greater or equal to 0", - "company_alignment_net_sda", "total_tech_deviation", "double", "The total difference between 'target_' and 'projected'", "Numerical value. Can be negative or positive", - "company_alignment_net_sda", "direction", "character", "The direction of the technology. Follows long term scenario requirements", "One of the following: 'buildout', 'phaseout'", - "company_alignment_net_sda", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power" + "company_alignment_net_sda", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "company_alignment_net_sda", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_alignment_net_sda", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'net'", + "company_alignment_net_sda", "total_deviation", "double", "Net aggregate deviation of all underlying technologies, accounting for directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "company_alignment_net_sda", "alignment_metric", "double", "Net aggregate alignment value by sector. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" ) # TODO: company_exposure_bo_po_aggregate_alignment<_by_...> From e6f587eb66862b5f3380b3139821f99feb86c057 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 26 Aug 2024 15:49:02 +0200 Subject: [PATCH 05/15] more explanations --- data-raw/data_dictionary.R | 72 +++++++++++++++++++++++++++++++++++--- 1 file changed, 68 insertions(+), 4 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index bc237191..b8c743eb 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -42,7 +42,6 @@ dd_company_alignment_bo_po_tms <- dplyr::tribble( "company_alignment_bo_po_tms", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" ) -# TODO dd_company_alignment_net_sda <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, "company_alignment_net_sda", "name_abcd", "character", "The name of the company", "The name of the company", @@ -57,16 +56,81 @@ dd_company_alignment_net_sda <- dplyr::tribble( "company_alignment_net_sda", "alignment_metric", "double", "Net aggregate alignment value by sector. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" ) -# TODO: company_exposure_bo_po_aggregate_alignment<_by_...> -# TODO: company_exposure_net_aggregate_alignment<_by_...> +dd_company_exposure_bo_po_aggregate_alignment <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "company_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", + "company_exposure_bo_po_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", + "company_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "company_exposure_bo_po_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", + "company_exposure_bo_po_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "company_exposure_bo_po_aggregate_alignment", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "company_exposure_bo_po_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "company_exposure_bo_po_aggregate_alignment", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_exposure_bo_po_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", + "company_exposure_bo_po_aggregate_alignment", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "company_exposure_bo_po_aggregate_alignment", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive", + "company_exposure_bo_po_aggregate_alignment", "loan_size_outstanding_currency", "character", "Denomination of the loans listed in the given banking book", "Three letter currency code following the ISO 4217 standard. Only one currency allowed per banking book", + "company_exposure_bo_po_aggregate_alignment", "loan_size_outstanding", "double", "Remaining outstanding loan value to the given counterparty", "Numerical value greater or equal to 0", + "company_exposure_bo_po_aggregate_alignment", "exposure_weight", "double", "Relative size of the loan compared to the overall size of the analysed banking book", "Numerical value greater or equal to 0" +) + +dd_company_exposure_net_aggregate_alignment <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "company_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", + "company_exposure_net_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", + "company_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", + "company_exposure_net_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", + "company_exposure_net_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "company_exposure_net_aggregate_alignment", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "company_exposure_net_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "company_exposure_net_aggregate_alignment", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "company_exposure_net_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'net'", + "company_exposure_net_aggregate_alignment", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "company_exposure_net_aggregate_alignment", "alignment_metric", "double", "Net aggregate alignment value by sector. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive", + "company_exposure_net_aggregate_alignment", "loan_size_outstanding_currency", "character", "Denomination of the loans listed in the given banking book", "Three letter currency code following the ISO 4217 standard. Only one currency allowed per banking book", + "company_exposure_net_aggregate_alignment", "loan_size_outstanding", "double", "Remaining outstanding loan value to the given counterparty", "Numerical value greater or equal to 0", + "company_exposure_net_aggregate_alignment", "exposure_weight", "double", "Relative size of the loan compared to the overall size of the analysed banking book", "Numerical value greater or equal to 0" +) + # TODO: loanbook_exposure_bo_po_aggregate_alignment<_by_...> +dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "loanbook_exposure_bo_po_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", + "loanbook_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "loanbook_exposure_bo_po_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", + "loanbook_exposure_bo_po_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "loanbook_exposure_bo_po_aggregate_alignment", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "loanbook_exposure_bo_po_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "loanbook_exposure_bo_po_aggregate_alignment", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "loanbook_exposure_bo_po_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", + "loanbook_exposure_bo_po_aggregate_alignment", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "loanbook_exposure_bo_po_aggregate_alignment", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" +) + # TODO: loanbook_exposure_net_aggregate_alignment<_by_...> +dd_loanbook_exposure_net_aggregate_alignment <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "loanbook_exposure_net_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", + "loanbook_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "loanbook_exposure_net_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", + "loanbook_exposure_net_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "loanbook_exposure_net_aggregate_alignment", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "loanbook_exposure_net_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "loanbook_exposure_net_aggregate_alignment", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "loanbook_exposure_net_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", + "loanbook_exposure_net_aggregate_alignment", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", + "loanbook_exposure_net_aggregate_alignment", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" +) data_dictionary <- dplyr::bind_rows( dd_company_technology_deviation_tms, dd_company_alignment_net_tms, dd_company_alignment_bo_po_tms, - dd_company_alignment_net_sda + dd_company_alignment_net_sda, + dd_company_exposure_bo_po_aggregate_alignment, + dd_company_exposure_net_aggregate_alignment, + dd_loanbook_exposure_bo_po_aggregate_alignment, + dd_loanbook_exposure_net_aggregate_alignment ) usethis::use_data(data_dictionary, overwrite = TRUE) From cd1f00bc05a3dd7b71975daa8bdd42463daa181e Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 26 Aug 2024 16:55:55 +0200 Subject: [PATCH 06/15] more explanations --- data-raw/data_dictionary.R | 35 ++++++++++++++++++----------------- 1 file changed, 18 insertions(+), 17 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index b8c743eb..75bdb9d6 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -92,34 +92,35 @@ dd_company_exposure_net_aggregate_alignment <- dplyr::tribble( "company_exposure_net_aggregate_alignment", "exposure_weight", "double", "Relative size of the loan compared to the overall size of the analysed banking book", "Numerical value greater or equal to 0" ) -# TODO: loanbook_exposure_bo_po_aggregate_alignment<_by_...> dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "loanbook_exposure_bo_po_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", - "loanbook_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", - "loanbook_exposure_bo_po_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", - "loanbook_exposure_bo_po_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", - "loanbook_exposure_bo_po_aggregate_alignment", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "loanbook_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", "loanbook_exposure_bo_po_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "loanbook_exposure_bo_po_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "loanbook_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", "loanbook_exposure_bo_po_aggregate_alignment", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", "loanbook_exposure_bo_po_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", - "loanbook_exposure_bo_po_aggregate_alignment", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", - "loanbook_exposure_bo_po_aggregate_alignment", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" + "loanbook_exposure_bo_po_aggregate_alignment", "n_companies", "double", "Number of individual company-by-sector combinations in the given sector analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0", + "loanbook_exposure_bo_po_aggregate_alignment", "n_companies_aligned", "double", "Number of individual company-by-sector combinations within the given sector that have an alignment metric greater or equal to 0", "Numerical value greater or equal to 0 and smaller or equal to 'n_companies'", + "loanbook_exposure_bo_po_aggregate_alignment", "share_companies_aligned", "double", "Share of 'n_companies_aligned' relative to 'n_companies'", "Numerical value. Must be between 0 and 1", + "loanbook_exposure_bo_po_aggregate_alignment", "exposure_weighted_net_alignment", "double", "Net aggregate alignment value aggregated to the banking book-by-sector level, disaggregated into 'buildout' and 'phaseout' components. Individual company alignment metrics are allocated based on financial exposure, using the 'exposure_weight'", "Numerical value. Can be negative or positive" ) -# TODO: loanbook_exposure_net_aggregate_alignment<_by_...> dd_loanbook_exposure_net_aggregate_alignment <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "loanbook_exposure_net_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", - "loanbook_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", - "loanbook_exposure_net_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", - "loanbook_exposure_net_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", - "loanbook_exposure_net_aggregate_alignment", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "loanbook_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", "loanbook_exposure_net_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "loanbook_exposure_net_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "loanbook_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", "loanbook_exposure_net_aggregate_alignment", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", - "loanbook_exposure_net_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", - "loanbook_exposure_net_aggregate_alignment", "total_deviation", "double", "Aggregate deviation of all underlying technologies of the same directionality. A more positive number means that the combination of underlying technologies is more aligned, a more negative one implies higher misalignment", "Numerical value. Can be negative or positive", - "loanbook_exposure_net_aggregate_alignment", "alignment_metric", "double", "Net aggregate alignment value by sector, disaggregated by direction of the underlying technlogies. A ratio that is calculated as the total deviation divided by the net scenario value (accounting for directionality). A positive value shows the company plans are ahead of target. A negative value means they are behind target", "Numerical value. Can be negative or positive" + "loanbook_exposure_net_aggregate_alignment", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'net'", + "loanbook_exposure_net_aggregate_alignment", "n_companies", "double", "Number of individual company-by-sector combinations in the given sector analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0", + "loanbook_exposure_net_aggregate_alignment", "n_companies_aligned", "double", "Number of individual company-by-sector combinations within the given sector that have an alignment metric greater or equal to 0", "Numerical value greater or equal to 0 and smaller or equal to 'n_companies'", + "loanbook_exposure_net_aggregate_alignment", "share_companies_aligned", "double", "Share of 'n_companies_aligned' relative to 'n_companies'", "Numerical value. Must be between 0 and 1", + "loanbook_exposure_net_aggregate_alignment", "exposure_weighted_net_alignment", "double", "Net aggregate alignment value aggregated to the banking book-by-sector level. Individual company alignment metrics are allocated based on financial exposure, using the 'exposure_weight'", "Numerical value. Can be negative or positive", + "loanbook_exposure_net_aggregate_alignment", "sum_loan_size_outstanding", "double", "Sum of outstanding loan size at the banking book-by-sector level of all loans analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0", + "loanbook_exposure_net_aggregate_alignment", "sum_exposure_companies_aligned", "double", "Sum of outstanding loan size at the banking book-by-sector level of all loans to aligned companies within this (group of) banking book(s)", "Numerical value greater or equal to 0 and smaller or equal to 'sum_loan_size_outstanding'", + "loanbook_exposure_net_aggregate_alignment", "share_exposure_aligned", "double", "Share of 'sum_exposure_companies_aligned' relative to 'sum_loan_size_outstanding'", "Numerical value. Must be between 0 and 1" ) data_dictionary <- dplyr::bind_rows( From e9c69d33dbdb302de5deaf26c386d8c5a83e9a0b Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 26 Aug 2024 18:02:41 +0200 Subject: [PATCH 07/15] style --- data-raw/data_dictionary.R | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index 75bdb9d6..439b5a04 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -1,6 +1,6 @@ # Data dictionary for the output table company_technology_deviation_tms dd_company_technology_deviation_tms <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "company_technology_deviation_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", "company_technology_deviation_tms", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", "company_technology_deviation_tms", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", @@ -15,7 +15,7 @@ dd_company_technology_deviation_tms <- dplyr::tribble( ) dd_company_alignment_net_tms <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "company_alignment_net_tms", "name_abcd", "character", "The name of the company", "The name of the company", "company_alignment_net_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", "company_alignment_net_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", @@ -29,7 +29,7 @@ dd_company_alignment_net_tms <- dplyr::tribble( ) dd_company_alignment_bo_po_tms <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "company_alignment_bo_po_tms", "name_abcd", "character", "The name of the company", "The name of the company", "company_alignment_bo_po_tms", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", "company_alignment_bo_po_tms", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", @@ -43,7 +43,7 @@ dd_company_alignment_bo_po_tms <- dplyr::tribble( ) dd_company_alignment_net_sda <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "company_alignment_net_sda", "name_abcd", "character", "The name of the company", "The name of the company", "company_alignment_net_sda", "sector", "character", "The sector of the technology", "One of the following: 'aviation', 'cement', 'steel'", "company_alignment_net_sda", "activity_unit", "character", "The unit the physical emission intensity is measured in for a given sector", "The unit corresponding to the sector. For example 'tCO2 / t cement'", @@ -57,7 +57,7 @@ dd_company_alignment_net_sda <- dplyr::tribble( ) dd_company_exposure_bo_po_aggregate_alignment <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "company_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", "company_exposure_bo_po_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", "company_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", @@ -75,7 +75,7 @@ dd_company_exposure_bo_po_aggregate_alignment <- dplyr::tribble( ) dd_company_exposure_net_aggregate_alignment <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "company_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", "company_exposure_net_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", "company_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", @@ -93,7 +93,7 @@ dd_company_exposure_net_aggregate_alignment <- dplyr::tribble( ) dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "loanbook_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", "loanbook_exposure_bo_po_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", "loanbook_exposure_bo_po_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", @@ -107,7 +107,7 @@ dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::tribble( ) dd_loanbook_exposure_net_aggregate_alignment <- dplyr::tribble( - ~dataset, ~column, ~typeof, ~definition, ~value, + ~dataset, ~column, ~typeof, ~definition, ~value, "loanbook_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", "loanbook_exposure_net_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", "loanbook_exposure_net_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", From ee44f1eaf55da887aa6b9cd1172b7ae7512091a2 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Tue, 27 Aug 2024 10:33:43 +0200 Subject: [PATCH 08/15] comments --- data-raw/data_dictionary.R | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index 439b5a04..ca8ed783 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -123,6 +123,26 @@ dd_loanbook_exposure_net_aggregate_alignment <- dplyr::tribble( "loanbook_exposure_net_aggregate_alignment", "share_exposure_aligned", "double", "Share of 'sum_exposure_companies_aligned' relative to 'sum_loan_size_outstanding'", "Numerical value. Must be between 0 and 1" ) +# TODO: data_sankey_<...> +# TODO: data_sankey_company_<...> +# TODO: data_scatter_alignment_exposure_<...> +# TODO: data_scatter__<...> +# TODO: data_scatter__company_<...> +# TODO: data_timeline_net__<...> +# TODO: data_timeline_bo_po__<...> + +# TODO: tms_results_all_groups +# TODO: sda_results_all_groups +# TODO: data_tech_mix__<...> +# TODO: data_trajectory___<...> +# TODO: data_emission_intensity__<...> +# TODO: companies_included__<...> + +# TODO: summary_statistics_loanbook_coverage + +# TODO: add tabular output for match_success_rate + + data_dictionary <- dplyr::bind_rows( dd_company_technology_deviation_tms, dd_company_alignment_net_tms, From 3c05fb4968b3e92517303f940d4e461f63e93b14 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Tue, 27 Aug 2024 11:54:33 +0200 Subject: [PATCH 09/15] more information --- data-raw/data_dictionary.R | 96 +++++++++++++++++++++++++++++++++----- 1 file changed, 84 insertions(+), 12 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index ca8ed783..27180180 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -58,7 +58,7 @@ dd_company_alignment_net_sda <- dplyr::tribble( dd_company_exposure_bo_po_aggregate_alignment <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "company_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", + "company_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", "company_exposure_bo_po_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", "company_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", "company_exposure_bo_po_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", @@ -76,7 +76,7 @@ dd_company_exposure_bo_po_aggregate_alignment <- dplyr::tribble( dd_company_exposure_net_aggregate_alignment <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "company_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", + "company_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", "company_exposure_net_aggregate_alignment", "name_abcd", "character", "The name of the company", "The name of the company", "company_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", "company_exposure_net_aggregate_alignment", "activity_unit", "character", "The unit the activity is measured in for a given sector", "The unit corresponding to the sector. For example 'MW' of capacity for power", @@ -94,7 +94,7 @@ dd_company_exposure_net_aggregate_alignment <- dplyr::tribble( dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "loanbook_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", + "loanbook_exposure_bo_po_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", "loanbook_exposure_bo_po_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", "loanbook_exposure_bo_po_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", "loanbook_exposure_bo_po_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", @@ -108,7 +108,7 @@ dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::tribble( dd_loanbook_exposure_net_aggregate_alignment <- dplyr::tribble( ~dataset, ~column, ~typeof, ~definition, ~value, - "loanbook_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value", + "loanbook_exposure_net_aggregate_alignment", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", "loanbook_exposure_net_aggregate_alignment", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", "loanbook_exposure_net_aggregate_alignment", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", "loanbook_exposure_net_aggregate_alignment", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", @@ -123,13 +123,79 @@ dd_loanbook_exposure_net_aggregate_alignment <- dplyr::tribble( "loanbook_exposure_net_aggregate_alignment", "share_exposure_aligned", "double", "Share of 'sum_exposure_companies_aligned' relative to 'sum_loan_size_outstanding'", "Numerical value. Must be between 0 and 1" ) -# TODO: data_sankey_<...> -# TODO: data_sankey_company_<...> -# TODO: data_scatter_alignment_exposure_<...> -# TODO: data_scatter__<...> -# TODO: data_scatter__company_<...> -# TODO: data_timeline_net__<...> -# TODO: data_timeline_bo_po__<...> +dd_data_sankey <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_sankey", "", "character", "Leftmost node in the sankey plot. Defines the split of the banking books into groups. Any additional descriptor either at the loan level or at the banking book level", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_sankey", "middle_node", "character", "Middle node in the sankey plot. A different grouping of interest. E.g. 'sector' would split the financial exposures according to sectoral exposure", "Must be available in the exposure alignment results used as input for the graph", + "data_sankey", "middle_node2", "character", "Optional: An additional middle node can be added for further disaggregation of exposures in the sankey plot", "Must be available in the exposure alignment results used as input for the graph", + "data_sankey", "is_aligned", "logical", "End node and color indicator. A dummy variable that indicates if the underlying counterparty related to the exposure is aligned based on the net alignment metric or not", "Value is either 'Aligned' or 'Not aligned'", + "data_sankey", "loan_size_outstanding", "double", "Remaining outstanding loan value to the underlying counterparty", "Numerical value greater or equal to 0" +) + +dd_data_scatter_alignment_exposure <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_scatter_alignment_exposure", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_scatter_alignment_exposure", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "data_scatter_alignment_exposure", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "data_scatter_alignment_exposure", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", + "data_scatter_alignment_exposure", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "data_scatter_alignment_exposure", "exposure_weighted_net_alignment", "double", "Net aggregate alignment value aggregated to the banking book-by-sector level. Individual company alignment metrics are allocated based on financial exposure, using the 'exposure_weight'", "Numerical value. Can be negative or positive", + "data_scatter_alignment_exposure", "sum_loan_size_outstanding", "double", "Sum of outstanding loan size at the banking book-by-sector level of all loans analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0" +) + +# TODO: currently the sector is only indicated by the file name, not by a column in the data +dd_data_scatter_sector <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_scatter_sector", "name", "character", "Name of the entity to analyse. If analysed at group level, this variable contains the values of . If analysed at company level, it contains the values of 'name_abcd'", "An identifying name of the entity", + "data_scatter_sector", "buildout", "character", "Net aggregate alignment value by sector, disaggregated to buildout technologies only", "Numerical value. Can be negative or positive", + "data_scatter_sector", "phaseout", "character", "Net aggregate alignment value by sector, disaggregated to phaseout technologies only", "Numerical value. Can be negative or positive", + "data_scatter_sector", "net", "character", "Net aggregate alignment value by sector of the entity analysed", "Numerical value. Can be negative or positive. Sum of the disaggregated components of 'buildout' and 'phaseout'", + "data_scatter_sector", "datapoint", "character", "The level of the analysis, either group level or company level", "Must be one of: 'Group' or 'company'" +) + +# TODO: currently the sector is only indicated by the file name, not by a column in the data +dd_data_scatter_sector_animated <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_scatter_sector_animated", "name", "character", "Name of the entity to analyse. If analysed at group level, this variable contains the values of . If analysed at company level, it contains the values of 'name_abcd'", "An identifying name of the entity", + "data_scatter_sector_animated", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "data_scatter_sector_animated", "buildout", "character", "Net aggregate alignment value by sector, disaggregated to buildout technologies only", "Numerical value. Can be negative or positive", + "data_scatter_sector_animated", "phaseout", "character", "Net aggregate alignment value by sector, disaggregated to phaseout technologies only", "Numerical value. Can be negative or positive", + "data_scatter_sector_animated", "net", "character", "Net aggregate alignment value by sector of the entity analysed", "Numerical value. Can be negative or positive. Sum of the disaggregated components of 'buildout' and 'phaseout'", + "data_scatter_sector_animated", "datapoint", "character", "The level of the analysis, either group level or company level", "Must be one of: 'Group' or 'company'" +) + +# same as loanbook_exposure_net_aggregate_alignment, but filtered for a specific sector +dd_data_timeline_net <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_timeline_net", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_timeline_net", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "data_timeline_net", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "data_timeline_net", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", + "data_timeline_net", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "data_timeline_net", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'net'", + "data_timeline_net", "n_companies", "double", "Number of individual company-by-sector combinations in the given sector analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0", + "data_timeline_net", "n_companies_aligned", "double", "Number of individual company-by-sector combinations within the given sector that have an alignment metric greater or equal to 0", "Numerical value greater or equal to 0 and smaller or equal to 'n_companies'", + "data_timeline_net", "share_companies_aligned", "double", "Share of 'n_companies_aligned' relative to 'n_companies'", "Numerical value. Must be between 0 and 1", + "data_timeline_net", "exposure_weighted_net_alignment", "double", "Net aggregate alignment value aggregated to the banking book-by-sector level. Individual company alignment metrics are allocated based on financial exposure, using the 'exposure_weight'", "Numerical value. Can be negative or positive", + "data_timeline_net", "sum_loan_size_outstanding", "double", "Sum of outstanding loan size at the banking book-by-sector level of all loans analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0", + "data_timeline_net", "sum_exposure_companies_aligned", "double", "Sum of outstanding loan size at the banking book-by-sector level of all loans to aligned companies within this (group of) banking book(s)", "Numerical value greater or equal to 0 and smaller or equal to 'sum_loan_size_outstanding'", + "data_timeline_net", "share_exposure_aligned", "double", "Share of 'sum_exposure_companies_aligned' relative to 'sum_loan_size_outstanding'", "Numerical value. Must be between 0 and 1" +) + +# same as loanbook_exposure_bo_po_aggregate_alignment, but filtered for a specific sector +dd_data_timeline_bo_po <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_timeline_bo_po", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_timeline_bo_po", "scenario", "character", "The name of the scenario against which alignment is measured", "Must be available in the input scenario data. Must be a scenario provided in the indicated 'scenario_source'", + "data_timeline_bo_po", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "data_timeline_bo_po", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "data_timeline_bo_po", "year", "integer", "The year of the data", "A year between the 'start_year' of the analyis and the 'start_year' plus the 'time_frame'", + "data_timeline_bo_po", "direction", "character", "At the sector level, 'direction' indicates if the alignment value is aggregated across buildout or phaseout technologies, or if it is the net aggregate of the sector.", "In this case, must be: 'buildout' or 'phaseout'", + "data_timeline_bo_po", "n_companies", "double", "Number of individual company-by-sector combinations in the given sector analysed within this (group of) banking book(s)", "Numerical value greater or equal to 0", + "data_timeline_bo_po", "n_companies_aligned", "double", "Number of individual company-by-sector combinations within the given sector that have an alignment metric greater or equal to 0", "Numerical value greater or equal to 0 and smaller or equal to 'n_companies'", + "data_timeline_bo_po", "share_companies_aligned", "double", "Share of 'n_companies_aligned' relative to 'n_companies'", "Numerical value. Must be between 0 and 1", + "data_timeline_bo_po", "exposure_weighted_net_alignment", "double", "Net aggregate alignment value aggregated to the banking book-by-sector level, disaggregated into 'buildout' and 'phaseout' components. Individual company alignment metrics are allocated based on financial exposure, using the 'exposure_weight'", "Numerical value. Can be negative or positive" +) # TODO: tms_results_all_groups # TODO: sda_results_all_groups @@ -151,7 +217,13 @@ data_dictionary <- dplyr::bind_rows( dd_company_exposure_bo_po_aggregate_alignment, dd_company_exposure_net_aggregate_alignment, dd_loanbook_exposure_bo_po_aggregate_alignment, - dd_loanbook_exposure_net_aggregate_alignment + dd_loanbook_exposure_net_aggregate_alignment, + dd_data_sankey, + dd_data_scatter_alignment_exposure, + dd_data_scatter_sector, + dd_data_scatter_sector_animated, + dd_data_timeline_net, + dd_data_timeline_bo_po ) usethis::use_data(data_dictionary, overwrite = TRUE) From 24c3d225a0f3cbe0c21fd92a9876892f4581536c Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Tue, 27 Aug 2024 18:00:51 +0200 Subject: [PATCH 10/15] more documentation --- data-raw/data_dictionary.R | 95 +++++++++++++++++++++++++++++++++++--- 1 file changed, 89 insertions(+), 6 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index 27180180..a0530a0b 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -197,11 +197,89 @@ dd_data_timeline_bo_po <- dplyr::tribble( "data_timeline_bo_po", "exposure_weighted_net_alignment", "double", "Net aggregate alignment value aggregated to the banking book-by-sector level, disaggregated into 'buildout' and 'phaseout' components. Individual company alignment metrics are allocated based on financial exposure, using the 'exposure_weight'", "Numerical value. Can be negative or positive" ) -# TODO: tms_results_all_groups -# TODO: sda_results_all_groups -# TODO: data_tech_mix__<...> -# TODO: data_trajectory___<...> -# TODO: data_emission_intensity__<...> +# TODO: extend variable grouping to standard PACTA and update +dd_tms_results_all_groups <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "tms_results_all_groups", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "tms_results_all_groups", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "tms_results_all_groups", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "tms_results_all_groups", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "tms_results_all_groups", "year", "integer", "The year of the data", "A year greater or equal to the 'start_year' of the analyis", + "tms_results_all_groups", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "tms_results_all_groups", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "tms_results_all_groups", "metric", "character", "Indicates if the production related values refer to the projected activities of the underlying counterparty, to the economy wide benchmark, or to allocated levels of activity based on the scenarios", "Must be one of the following: 'projected', 'corporate_economy', or 'target_'", + "tms_results_all_groups", "production", "double", "The production level of the given 'metric'", "Numerical value greater or equal to 0", + "tms_results_all_groups", "technology_share", "double", "The share of the 'production' the given 'technology' relative to all technologies of the corresponding 'sector' for the gien combination of 'group_id', 'region', 'year' and 'metric'", "Numerical value between 0 and 1", + "tms_results_all_groups", "scope", "character", "Indicates if the targets for the given technology have been calculated based on the TMSR (technology) or the SMSP (sector). High-carbon technologies that need to decrease have their targets calculated on the technology level, whereas low-carbon technologies that need to increase have them calculated on the sector level", "Must be one of: 'technology' or 'sector'", + "tms_results_all_groups", "percentage_of_initial_production_by_scope", "double", "Relative change compared to the start value (by scope). Used for displaying the change in activity over time on a common scale", "Numerical value. Can be negative or positive" +) + +# TODO: extend variable grouping to standard PACTA and update +dd_sda_results_all_groups <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "sda_results_all_groups", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "sda_results_all_groups", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "sda_results_all_groups", "sector", "character", "The sector of the technology", "One of the following: 'aviation', 'cement', 'steel'", + "sda_results_all_groups", "year", "integer", "The year of the data", "A year greater or equal to the 'start_year' of the analyis", + "sda_results_all_groups", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "sda_results_all_groups", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "sda_results_all_groups", "emission_factor_metric", "character", "Indicates if the emission intensity related values refer to the projected activities of the underlying counterparty, to the economy wide benchmark, or to allocated levels of activity based on the scenarios", "Must be one of the following: 'projected', 'corporate_economy', or 'target_'", + "sda_results_all_groups", "emission_factor_value", "double", "The physical emission intensity level of the given 'emission_factor_metric'", "Numerical value greater or equal to 0" +) + +# TODO: extend variable grouping to standard PACTA and update +dd_data_tech_mix <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_tech_mix", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "data_tech_mix", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_tech_mix", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "data_tech_mix", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "data_tech_mix", "year", "integer", "The year of the data", "A year greater or equal to the 'start_year' of the analyis", + "data_tech_mix", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "data_tech_mix", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "data_tech_mix", "metric", "character", "Indicates if the production related values refer to the projected activities of the underlying counterparty, to the economy wide benchmark, or to allocated levels of activity based on the scenarios", "Must be one of the following: 'projected', 'corporate_economy', or 'target_'", + "data_tech_mix", "production", "double", "The production level of the given 'metric'", "Numerical value greater or equal to 0", + "data_tech_mix", "technology_share", "double", "The share of the 'production' the given 'technology' relative to all technologies of the corresponding 'sector' for the gien combination of 'group_id', 'region', 'year' and 'metric'", "Numerical value between 0 and 1", + "data_tech_mix", "scope", "character", "Indicates if the targets for the given technology have been calculated based on the TMSR (technology) or the SMSP (sector). High-carbon technologies that need to decrease have their targets calculated on the technology level, whereas low-carbon technologies that need to increase have them calculated on the sector level", "Must be one of: 'technology' or 'sector'", + "data_tech_mix", "percentage_of_initial_production_by_scope", "double", "Relative change compared to the start value (by scope). Used for displaying the change in activity over time on a common scale", "Numerical value. Can be negative or positive", + "data_tech_mix", "label", "character", "Same as 'metric', formatted for display in plot", "Must be one of the following: 'projected', 'corporate_economy', or 'target_', but formatted for display", + "data_tech_mix", "label_tech", "character", "Same as 'technology', formatted for display in plot", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "data_tech_mix", "value", "double", "Same as 'technology_share', for display in plot", "Numerical value between 0 and 1" +) + +# TODO: extend variable grouping to standard PACTA and update +dd_data_trajectory <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_trajectory", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "data_trajectory", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_trajectory", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas'", + "data_trajectory", "technology", "character", "The technology", "One of the in-scope PACTA technologies that belong to the sector indicated in 'sector'", + "data_trajectory", "year", "integer", "The year of the data", "A year greater or equal to the 'start_year' of the analyis", + "data_trajectory", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "data_trajectory", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "data_trajectory", "metric", "character", "Indicates if the production related values refer to the projected activities of the underlying counterparty, to the economy wide benchmark, or to allocated levels of activity based on the scenarios", "Must be one of the following: 'projected', 'corporate_economy', or 'target_'", + "data_trajectory", "production", "double", "The production level of the given 'metric'", "Numerical value greater or equal to 0", + "data_trajectory", "technology_share", "double", "The share of the 'production' the given 'technology' relative to all technologies of the corresponding 'sector' for the gien combination of 'group_id', 'region', 'year' and 'metric'", "Numerical value between 0 and 1", + "data_trajectory", "scope", "character", "Indicates if the targets for the given technology have been calculated based on the TMSR (technology) or the SMSP (sector). High-carbon technologies that need to decrease have their targets calculated on the technology level, whereas low-carbon technologies that need to increase have them calculated on the sector level", "Must be one of: 'technology' or 'sector'", + "data_trajectory", "percentage_of_initial_production_by_scope", "double", "Relative change compared to the start value (by scope). Used for displaying the change in activity over time on a common scale", "Numerical value. Can be negative or positive", + "data_trajectory", "label", "character", "Same as 'metric', formatted for display in plot", "Must be one of the following: 'projected', 'corporate_economy', or 'target_', but formatted for display", + "data_trajectory", "value", "double", "Same as 'percentage_of_initial_production_by_scope', for display in plot", "Numerical value. Can be negative or positive" +) + +# TODO: extend variable grouping to standard PACTA and update +dd_data_emission_intensity <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "data_emission_intensity", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "data_emission_intensity", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "data_emission_intensity", "sector", "character", "The sector of the technology", "One of the following: 'aviation', 'cement', 'steel'", + "data_emission_intensity", "year", "integer", "The year of the data", "A year greater or equal to the 'start_year' of the analyis", + "data_emission_intensity", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "data_emission_intensity", "scenario_source", "character", "The publication the scenario data is based on", "Must be available in the input scenario data. Usually, available sources are: 'weo', 'geco', 'isf'. Usually follows the pattern '_'", + "data_emission_intensity", "emission_factor_metric", "character", "Indicates if the emission intensity related values refer to the projected activities of the underlying counterparty, to the economy wide benchmark, or to allocated levels of activity based on the scenarios", "Must be one of the following: 'projected', 'corporate_economy', or 'target_'", + "data_emission_intensity", "emission_factor_value", "double", "The physical emission intensity level of the given 'emission_factor_metric'", "Numerical value greater or equal to 0", + "data_emission_intensity", "label", "character", "Same as 'emission_factor_metric', formatted for display in plot", "Must be one of the following: 'projected', 'corporate_economy', or 'target_', but formatted for display" +) + # TODO: companies_included__<...> # TODO: summary_statistics_loanbook_coverage @@ -223,7 +301,12 @@ data_dictionary <- dplyr::bind_rows( dd_data_scatter_sector, dd_data_scatter_sector_animated, dd_data_timeline_net, - dd_data_timeline_bo_po + dd_data_timeline_bo_po, + dd_tms_results_all_groups, + dd_sda_results_all_groups, + dd_data_tech_mix, + dd_data_trajectory, + dd_data_emission_intensity ) usethis::use_data(data_dictionary, overwrite = TRUE) From 78dc6d314e38b44edc059e79c5c3ab20a51aefeb Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Wed, 28 Aug 2024 10:28:39 +0200 Subject: [PATCH 11/15] add more documentation --- data-raw/data_dictionary.R | 54 +++++++++++++++++++++++++++++++++++--- 1 file changed, 50 insertions(+), 4 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index a0530a0b..30b31168 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -280,11 +280,54 @@ dd_data_emission_intensity <- dplyr::tribble( "data_emission_intensity", "label", "character", "Same as 'emission_factor_metric', formatted for display in plot", "Must be one of the following: 'projected', 'corporate_economy', or 'target_', but formatted for display" ) -# TODO: companies_included__<...> +# TODO: extend variable grouping to standard PACTA and update +# TODO: possibly deprecate this output +dd_companies_included <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "companies_included", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "companies_included", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "companies_included", "name_abcd", "character", "The name of the company", "The name of the company", + "companies_included", "sector_abcd", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", + "companies_included", "loan_size_outstanding", "double", "Remaining outstanding loan value to the given counterparty", "Numerical value greater or equal to 0", + "companies_included", "loan_size_outstanding_currency", "character", "Denomination of the outstanding loans listed in the given banking book", "Three letter currency code following the ISO 4217 standard. Only one currency allowed per banking book", + "companies_included", "loan_size_credit_limit", "double", "Maximum value provided to the a counterparty under the given credit line", "Numerical value greater or equal to 0", + "companies_included", "loan_size_credit_limit_currency", "character", "Denomination of the credit lines of loans listed in the given banking book", "Three letter currency code following the ISO 4217 standard. Only one currency allowed per banking book" +) -# TODO: summary_statistics_loanbook_coverage +# TODO: extend variable grouping to standard PACTA and update +dd_summary_statistics_loanbook_coverage <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "summary_statistics_loanbook_coverage", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "summary_statistics_loanbook_coverage", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "summary_statistics_loanbook_coverage", "region", "character", "The region for which the analysis has been run. Indicates which production assets have been considered and which scenario region is used", "Must be a value available in the input scenario data", + "summary_statistics_loanbook_coverage", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", + "summary_statistics_loanbook_coverage", "total_exposure", "double", "Remaining outstanding loan value to the all companies in the sector that have some operations within the given region", "Numerical value greater or equal to 0", + "summary_statistics_loanbook_coverage", "n_companies_matched", "integer", "Number of companies identified for analysis in the given region and sector. Any matched company is counted regardless of size of exposure", "Integer value greater or equal to 0", + "summary_statistics_loanbook_coverage", "n_companies_total", "integer", "Total number of companies in the reference dataset in the given region and sector", "Integer value greater or equal to 0", + "summary_statistics_loanbook_coverage", "share_companies_matched", "double", "Share of companies identified for analysis relative to total number of companies in the reference dataset. This is a proxy for which part of the economy of a region is covered by the analysis", "Numerical value between 0 and 1", + "summary_statistics_loanbook_coverage", "production_financed", "double", "Sum of production in a sector and region by all companies identfied for analysis. The amount of production is not weighted by exposure", "Numerical value greater or equal to 0", + "summary_statistics_loanbook_coverage", "production_total", "double", "Sum of production in a sector and region by all companies in the reference dataset", "Numerical value greater or equal to 0", + "summary_statistics_loanbook_coverage", "share_production_financed", "double", "Share of production of companies identified for analysis relative to production by all companies in the reference dataset. This is a proxy for how much of the output of a region is covered by the analysis", "Numerical value between 0 and 1" +) -# TODO: add tabular output for match_success_rate +# TODO: extend variable grouping to standard PACTA and update +# TODO: probably better to export data_lbk_match_success_rate, which is actual format used in plots +dd_lbk_match_success_rate <- dplyr::tribble( + ~dataset, ~column, ~typeof, ~definition, ~value, + "lbk_match_success_rate", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", + # "lbk_match_success_rate", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", + "lbk_match_success_rate", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", + "lbk_match_success_rate", "matched", "character", "to be deprecated", "to be deprecated", + "lbk_match_success_rate", "match_n", "double", "Remaining outstanding loan value to the all companies in the sector that have some operations within the given region", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "total_n", "integer", "Number of companies identified for analysis in the given region and sector. Any matched company is counted regardless of size of exposure", "Integer value greater or equal to 0", + "lbk_match_success_rate", "match_success_rate_rel", "integer", "Total number of companies in the reference dataset in the given region and sector", "Integer value greater or equal to 0", + "lbk_match_success_rate", "match_outstanding", "double", "Share of companies identified for analysis relative to total number of companies in the reference dataset. This is a proxy for which part of the economy of a region is covered by the analysis", "Numerical value between 0 and 1", + "lbk_match_success_rate", "total_outstanding", "double", "Sum of production in a sector and region by all companies identfied for analysis. The amount of production is not weighted by exposure", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "match_success_outstanding_rel", "double", "Sum of production in a sector and region by all companies in the reference dataset", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "match_credit_limit", "double", "Share of production of companies identified for analysis relative to production by all companies in the reference dataset. This is a proxy for how much of the output of a region is covered by the analysis", "Numerical value between 0 and 1", + "lbk_match_success_rate", "total_credit_limit", "double", "Sum of production in a sector and region by all companies in the reference dataset", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "match_success_credit_limit_rel", "double", "Share of production of companies identified for analysis relative to production by all companies in the reference dataset. This is a proxy for how much of the output of a region is covered by the analysis", "Numerical value between 0 and 1" +) data_dictionary <- dplyr::bind_rows( @@ -306,7 +349,10 @@ data_dictionary <- dplyr::bind_rows( dd_sda_results_all_groups, dd_data_tech_mix, dd_data_trajectory, - dd_data_emission_intensity + dd_data_emission_intensity, + dd_companies_included, + dd_summary_statistics_loanbook_coverage, + dd_lbk_match_success_rate ) usethis::use_data(data_dictionary, overwrite = TRUE) From b888f9c0b713b00aa84451a6c3417b9bdbd9bde3 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 2 Sep 2024 14:47:25 +0200 Subject: [PATCH 12/15] finish documentation --- data-raw/data_dictionary.R | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index 30b31168..c87f8796 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -317,16 +317,16 @@ dd_lbk_match_success_rate <- dplyr::tribble( "lbk_match_success_rate", "group_id", "character", "Identification of the banking book analysed", "The group_id is automatically generated from the file name of the corresponding raw banking book", # "lbk_match_success_rate", "", "character", "Any additional descriptor either at the loan level or at the banking book level. This is used to calculate grouped results by additional dimensions of interest, such as types of FIs or types of loans", "Any variable name is permissible, that is not already used otherwise. All entries in the banking book should have a corresponding value. NULL is permissible and implies no grouping", "lbk_match_success_rate", "sector", "character", "The sector of the technology", "One of the following: 'power', 'automotive', 'coal', 'oil and gas', 'aviation', 'cement', 'steel'", - "lbk_match_success_rate", "matched", "character", "to be deprecated", "to be deprecated", - "lbk_match_success_rate", "match_n", "double", "Remaining outstanding loan value to the all companies in the sector that have some operations within the given region", "Numerical value greater or equal to 0", - "lbk_match_success_rate", "total_n", "integer", "Number of companies identified for analysis in the given region and sector. Any matched company is counted regardless of size of exposure", "Integer value greater or equal to 0", - "lbk_match_success_rate", "match_success_rate_rel", "integer", "Total number of companies in the reference dataset in the given region and sector", "Integer value greater or equal to 0", - "lbk_match_success_rate", "match_outstanding", "double", "Share of companies identified for analysis relative to total number of companies in the reference dataset. This is a proxy for which part of the economy of a region is covered by the analysis", "Numerical value between 0 and 1", - "lbk_match_success_rate", "total_outstanding", "double", "Sum of production in a sector and region by all companies identfied for analysis. The amount of production is not weighted by exposure", "Numerical value greater or equal to 0", - "lbk_match_success_rate", "match_success_outstanding_rel", "double", "Sum of production in a sector and region by all companies in the reference dataset", "Numerical value greater or equal to 0", - "lbk_match_success_rate", "match_credit_limit", "double", "Share of production of companies identified for analysis relative to production by all companies in the reference dataset. This is a proxy for how much of the output of a region is covered by the analysis", "Numerical value between 0 and 1", - "lbk_match_success_rate", "total_credit_limit", "double", "Sum of production in a sector and region by all companies in the reference dataset", "Numerical value greater or equal to 0", - "lbk_match_success_rate", "match_success_credit_limit_rel", "double", "Share of production of companies identified for analysis relative to production by all companies in the reference dataset. This is a proxy for how much of the output of a region is covered by the analysis", "Numerical value between 0 and 1" + "lbk_match_success_rate", "matched", "character", "Indicates if the matching values are shown for matched or unmatched loans", "Must be one of the following: 'Matched' or 'Not matched'", + "lbk_match_success_rate", "match_n", "integer", "Number of loans identified for analysis in a given sector in the given banking book that were successfully matched with companies in the production data", "Integer value greater or equal to 0", + "lbk_match_success_rate", "total_n", "integer", "Total number of loans in the banking book for a given sector", "Integer value greater or equal to 0", + "lbk_match_success_rate", "match_success_rate_rel", "double", "Share of matched loans in a secftor relative to total number of loans in the sector in the raw input banking book", "Numerical value between 0 and 1", + "lbk_match_success_rate", "match_outstanding", "double", "Remaining outstanding loan value in the banking book to the all matched companies in the sector", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "total_outstanding", "double", "Total outstanding loan value in the banking book in a given sector for matched and unmatched loans", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "match_success_outstanding_rel", "double", "Share of the matched outstanding loan amount in a sector relative to the total outstanding loan amount in that sector", "Numerical value between 0 and 1", + "lbk_match_success_rate", "match_credit_limit", "double", "Sum value of the credit limit of all matched loans within a sector", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "total_credit_limit", "double", "Total value of the credit limit of all loans matched or unmatched within a sector", "Numerical value greater or equal to 0", + "lbk_match_success_rate", "match_success_credit_limit_rel", "double", "Share of the matched amount of credit limit in a sector relative to the total credit limit in that sector", "Numerical value between 0 and 1" ) From 67c3508ac12a05d3f0a6d7adaba5fca513aa6966 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Mon, 2 Sep 2024 16:54:45 +0200 Subject: [PATCH 13/15] basic vignette for data_dictionary --- DESCRIPTION | 4 +- R/data.R | 16 ++++ R/sysdata.rda | Bin 461 -> 5433 bytes data-raw/data_dictionary.R | 5 +- data/data_dictionary.rda | Bin 0 -> 5433 bytes man/data_dictionary.Rd | 30 ++++++++ vignettes/data_dictionary.Rmd | 139 ++++++++++++++++++++++++++++++++++ 7 files changed, 192 insertions(+), 2 deletions(-) create mode 100644 R/data.R create mode 100644 data/data_dictionary.rda create mode 100644 man/data_dictionary.Rd create mode 100644 vignettes/data_dictionary.Rmd diff --git a/DESCRIPTION b/DESCRIPTION index 9989c0c6..8687a4b2 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -59,7 +59,8 @@ Suggests: rmarkdown, usethis, testthat (>= 3.0.0), - writexl + writexl, + DT Config/testthat/edition: 3 Roxygen: list(markdown = TRUE) Config/Needs/website: rmi-pacta/pacta.pkgdown.rmitemplate @@ -67,3 +68,4 @@ VignetteBuilder: knitr URL: https://rmi-pacta.github.io/workflow.multi.loanbook/, https://github.com/RMI-PACTA/workflow.multi.loanbook/ +LazyData: true diff --git a/R/data.R b/R/data.R new file mode 100644 index 00000000..c44a7559 --- /dev/null +++ b/R/data.R @@ -0,0 +1,16 @@ +#' Data dictionary +#' +#' An overview of the output data sets generated by the package, their data types, +#' and the definitions of the variables. +#' +#' @format ## `data_dictionary` +#' \describe{ +#' \item{dataset}{Name of the dataset} +#' \item{column}{Name of the column} +#' \item{typeof}{Data type of the column} +#' \item{definition}{Description of what the column stands for} +#' \item{value}{Which values are allowed for the column} +#' ... +#' } +#' @source internal +"data_dictionary" diff --git a/R/sysdata.rda b/R/sysdata.rda index 70f8e2a7c0bdd996932b5aa9775d8ebdb1555683..363def70a8e4ba87a4add3690836d8051c95c867 100644 GIT binary patch literal 5433 zcmV-96~^j9T4*^jL0KkKSxfR^G5{ZwfB*mg|F7=<{MG;e|KR`s|MS6M5JCe$h9H85 z00aa85CPyKJ_pbhDnLj8palRV0x&H=000DnN&oS+B?Gz|bW0g;iKnE(cWVlgxYDIkD?6Cf$3m?2MUCec4s^*ki? zG#VNJ00Tf89;4L600y2?fv*=P=Mh7iv=v0|#1k22%O$4MQB#a~xksV_~DIyV(Bq9W4AuLcc5}tvfe4FL(Z0BzN|HrNF z=RSvzCvQB>zTf1RLw{YiFIO^VGf;O>wdggry8@i3Z3}7K$dpONysb%bX}b$z37N8M zYU`U#+4QNX84fLbs6i>Upqo>hK`@d*-LrW!4~N7q@m;}QGwqb=~SqVh=HNl!c|N%o8N82sNr>-hWt94 zX}EQ@p|zxD><-h-gk1#KY8Ap_I~qEc2C8A86+_E^8^^E^%CLBq^8<0jE4m8NVjc`q z!HlwpOHt`sdQV3#6MD#PyRx{O&z{`deRXTfaZ9XlnX_%D;!X{@o6^fVtj=tjnwuMr z9e7iR+g!7uyTRVo8Zn<}{3_e;3>&;RT$hAmcbHtQtJ1lKj)QrFfuTKV{F~hB##!yQ z-5jOHe!OKm(|GSX(&r^&SyO^>44RoHLF=dmkl<}-xOO;FE!N3r^t5lmD2BBip`0~M zpm)y=k0mK4DGdO`WNMYc*}U9+)aA9y;odU z**8(G@@ewb%W2xg;(AA2dk>#iDm+cchW6>9>rS)BM;j)~nW4Y?qk*(-4eQ<7I6Pk6 znwvD~V+Z|B>9b6=ab9P2-1xgD7kc6HwMf{tn_MlMY{e^k-!!sBumwcDlBvBp=fAXd zRpp7Od`oSg&c^o{Oky35$N7W3mZU7^!|Hd&FR E=c^dIB^XA5(%cMN35G<2scgqWlaVnKEO~o zFV?bGMBdThxw7>>Gs4-la4oExd?!h_tnxQpvU>EME@uVgxh@XY_Z{a*(hofE-W)?vE|jc`7mt8BB18_z z|L6i=!Ln@GZA-jV3Q|{SaTn}tph>Zyl+9RT^tLGrWhfPNvrRg0IlA`kbZ@?!T-%)E zSG0f4H4hKD!QR}rTDi7|YSMTP2h^vab=t(@@pALu7(R6WDI$Bu3|2?i7`-ES;CkI| zgubY+Sjv~I>gi3cju>v)Z0Q;sM|ta8jvXeZuEcCOPqO?kdAdAD)!$o9Pr_~Gk0V;r zTeP>nE!|y>>zE6Pe(GRXqVP~udsD{xu9rtZ3ppU_x zhV$~*)zXOXC{d6dfY2OwzXA!UDvv5d|Tr zo<2kMoO7tqArVGa8Qx6>qKZwQ*dYiR?LhPreivqt3ox4#aF}jBQQl}W(xXKPXvn4! zAchw6AF42Q`E;MiCn4@B5v|c=*^1!#B3MO(F3PGQ;x;I$5W;K?96|x1>Lmb0S@yIb zBt$?uNFu6N;OiL^FAw=FRN}Ckqf2BrPvHWD2oND8?g{z+t&C~sH@a+6bzlevmBq7uxh#+E8L44sc-*v{ zqx&>?ue9WLovU>0SlaYsFEw`XC;an*X*b_V&#_I7wwD_A_O0oaJ&qH-Gr8!9Bg6(1 z`>W?(lW1VX-8-74-issMGG>DG>(!5is%4m8Ce~*MZkn4}}SBpUXh9>2d=znct?(zF+ zX-32{4hDri$o*yY(R>$?`RF>A-7-G3%au#a^>=U!yawyRu%4SXHRmcuk{usg{k# z(@dK!MlRJ&h~RNP+Im?!a5jvl(q%Mnhm`AcRe_U^m5BAHp#L~Bi`Jt_-aR`P;^e9L z(+L=2ccTix+`PW|4`Iry29){~?z*7&gFo|SJtG70*pKO>_S31}CA^rYvdW3QrgNN-orKF4(KFqgw>vK?3YFdC!0upq(Qo}Ct|ZUDl6XraI& zFbCCG(N@F**Av$S@dfLPU`>L=PGxy=Hj%3AnsIrwww#Yx_*KYi0~6yb8De5$ZL(UW z8Cb8jPELcVb6uw`YfQ*y1+c`*u?AwS4n_@9++=H{)l*EY8{{=BGGsD1%P=^yeL^Ov z7YwKeiR*O%>ZjXZQ96gk7J`4YaF0prZ4P7(0qw|;3cU+d?Zr7K*#ZwNhEd4-7A6*n zW}{R-n5UH5`(q&b>D)CqmX3d3L+(?&y+llLf$lHK?#|sNt$-ZW~O+wEZ$O3%J9Xi*cW`OD1nQF2TJuGlK;2)OlaeJ3B)pU6IVmb;?z(O|I13-yqh(xs1lru`;I=^_i1k=h*g+ zqiLblEMmBN_l_ynouf}QUQ8{Xn%E461tYO6gCE`vGV^1FCE#G%q(RXW-`kH!x+k};(X(ib62Fviu;z;PX71tPRC&38<&yZ zZ{F(;9all?NZyTf3{#Q2;(Pud3T+(GlHV%a=&w6fw90FUY8PS5UcEz9J{>Cdn$O=x z$+jlbOidE=Ri(5#9|E$f?Mvdiz(pbp;2nhRrH_!D=^T5J6Tk?I%#2l$ii~9zV=PlF zlQ6w0iv8mcHTX}r4CP;6k;4}Z6@T-wXl?d)+oS1HoiY#3oj43sG@C3wG~90&+e>i% zTPjYndh=yRGOZ-qiexXbC5P_Es($#`c(67`b(MR5CPU$pU91v(FY3lv$mtGLa#!xmqXgY?&$+O0SATMdipKC@QUc*AK}d>5hP(k9CIzjjUr;q}3K z%p*Rviz$-JA&jhsJtmsSWQJI3v4bjESvHr_@D2TDddE`Ouv&~ZqfwhF6!kk zkbP3YUm1z|*$3KQl#P2i&GOS1c@3@>lC~cfiH{3Dlp86;xrgV-C*N>mJXFcUb#O3Oyrxm(DZsq` z*Kg8d{%aHYQ~!B%7rK7OnIBsvTl>v>#@8^tM-$qY)mutVoeQbZm}Nf7I3UYRp@1Sa z9?1K2?*#c<`<&j_I6ZsN<_-iL$KJh%y?fE1_zK?Eq|tDeD&(c`rX=Q(!>#+)9VS0A z%xQlY^LRF%L%}@9Rd`Npe6E##UBl4D6BkKn*(UpBZN?KiX;xu&r)kW}Hnd-hvf7R2 zscO*EB-J-xqfp_BxEU*T#j7EfLusX}W)`hVGZOD2`A^qpUC-GND>ixe#?2zrEc7th*n6#QL1^?D2(-8J1h3^@V&7+$t#V~C)jg$Ea zgC{W850Y<3&Jy!z$EUb95EgmaR~guB&Pydx&5ACbA>;_#$)9dOQ2yd4#~c8S=V z7_zcx!KF7Q)Xd3ORudRWv8|-?WSXY+Wn$HZ%yJ(=iJ35EQM!I~&%9P9NszMqLn~CX zCIyqFKSea03-=0YO(wznG?z<8Ux_DA1tZ+%Me+`=L)?q{Qk{^yw;qE*`&*i}3`sPv zNgh^U!m?#i`xmm<+L$veg7FrrVd%7UR^gIxMU`#TjHAV9$&Cyc)fyU-{^HinqgB%s z*|wz08k!okn5;&HbsYAqdej@swBV01&XS#HjDHS>W}PGVvoVZM1E7COL+l@)W73Z` zN5Yfl=}cn-3}ox`jH?D*rZLSsd9{bMnFiUDDYNV;_0K9NUFno`D|Pr)3iyv^pcWS= zj#Wz`93c~cJ?O@y_9@Y{Tb>65e}a_B)CY{w7LHTi{ZDyux)B}99sfubQ|T$v_qe0< zpM;mzFt4d(n%1OQ8mn2Y8m45X7K=%vD=;RRlT9SV%vPbPH6@gtY?iWRlO{$OmeyG- zG#M*Y%~n$>jX-HRmfC(fes{pP8MyH?Bck*M##2WaYMC`O(q^WWkt-^ZNDBfHiZTP* z0b(;hSG6_3d*3;W5&H?Er{JIA)9y{D7xXXe zO>K4>Pt{)vybsXj`sn1=WIBwdOpKUUa`{?|`kXCvUtCBGVF%N8pw(Kf6nT(0DKO!l zN_xMsy0{Lv+Ya+$YPL)95vg#UgDWKY(^T+S`9FQ^2R7W6|l?%+}4DevR3i7TIdk1meWT%(1D0(m*f4R4|*NfGm_T z610;Q8VLclT{caZPIzw5(X?#E9VabIiKJ!>{-kqr7hXE2M^-!LvmEPVDWu-H;%2n- zi8oI9Su!lqJ4)=NZaO8}%rXykBRMj>kK0BmFN5dZhw9sKN;B`$-RlVH2)Y`e6XLQMm zWW|FrSjm=CC5ekEnN0`f+M7|j+*-0>ES-ZJrTd*KzgnFg)fts9pt(idL`M-o)(ROk z6RW>ZyVcq9w`CsjS9l&1YNncF5x6}ob0uM42>IEW20)P_MLW(hd{g10=OR6kPQoB{ z#cHSN;U}pn{0e=NbdR^CFYBjWQ{_K{85qh&lfQq2J&E&KSBOU`FD2)paZ&ws4>8d8 zy{yz?jH>yIAj&WA{Np;JpD}I>iIs^yl~yF?8V!>vwAz_bv}%0JKN(#srccLBQ;^c#*=I#z~T&XmcxS>_ULFxgZ05e9Q8hJE^%}`_^2%e_GXo2bg00x1h zKmY&$Ng}4n4D}O3$c8`-41+)ch-d>%G(AsZ#93ixQ9R^K;>}_XBr$q|MgQd&udHt4 zf~O4bh~#wM1QIGRy6?Ci$MpE$@cEviU;wPhL^wMNZ9q_@S5#yw+lquPbZ`q2uS=e2Sz2aX03fA zatjP#=*A8XT12i{tUZ|!`?d>4BU0+rBOxc(_K+xec(G1Jp^8mmE+~VX`gaS4V zHFF3d#20j@&{B$=j=?2LL~$tkl7Oitt6MOD$Z1HZ_|7s-8_fWi$f%JCR%S&S!G%|H zZJMs<_k7a*Ta%$OWf}t4;q`cP){KyHRZR`6DpI6tTHoSij^s-PpW^OFrwS4te+k0i DR9w$h diff --git a/data-raw/data_dictionary.R b/data-raw/data_dictionary.R index c87f8796..20eef7f5 100644 --- a/data-raw/data_dictionary.R +++ b/data-raw/data_dictionary.R @@ -355,4 +355,7 @@ data_dictionary <- dplyr::bind_rows( dd_lbk_match_success_rate ) -usethis::use_data(data_dictionary, overwrite = TRUE) +usethis::use_data( + data_dictionary, + overwrite = TRUE +) diff --git a/data/data_dictionary.rda b/data/data_dictionary.rda new file mode 100644 index 0000000000000000000000000000000000000000..363def70a8e4ba87a4add3690836d8051c95c867 GIT binary patch literal 5433 zcmV-96~^j9T4*^jL0KkKSxfR^G5{ZwfB*mg|F7=<{MG;e|KR`s|MS6M5JCe$h9H85 z00aa85CPyKJ_pbhDnLj8palRV0x&H=000DnN&oS+B?Gz|bW0g;iKnE(cWVlgxYDIkD?6Cf$3m?2MUCec4s^*ki? zG#VNJ00Tf89;4L600y2?fv*=P=Mh7iv=v0|#1k22%O$4MQB#a~xksV_~DIyV(Bq9W4AuLcc5}tvfe4FL(Z0BzN|HrNF z=RSvzCvQB>zTf1RLw{YiFIO^VGf;O>wdggry8@i3Z3}7K$dpONysb%bX}b$z37N8M zYU`U#+4QNX84fLbs6i>Upqo>hK`@d*-LrW!4~N7q@m;}QGwqb=~SqVh=HNl!c|N%o8N82sNr>-hWt94 zX}EQ@p|zxD><-h-gk1#KY8Ap_I~qEc2C8A86+_E^8^^E^%CLBq^8<0jE4m8NVjc`q z!HlwpOHt`sdQV3#6MD#PyRx{O&z{`deRXTfaZ9XlnX_%D;!X{@o6^fVtj=tjnwuMr z9e7iR+g!7uyTRVo8Zn<}{3_e;3>&;RT$hAmcbHtQtJ1lKj)QrFfuTKV{F~hB##!yQ z-5jOHe!OKm(|GSX(&r^&SyO^>44RoHLF=dmkl<}-xOO;FE!N3r^t5lmD2BBip`0~M zpm)y=k0mK4DGdO`WNMYc*}U9+)aA9y;odU z**8(G@@ewb%W2xg;(AA2dk>#iDm+cchW6>9>rS)BM;j)~nW4Y?qk*(-4eQ<7I6Pk6 znwvD~V+Z|B>9b6=ab9P2-1xgD7kc6HwMf{tn_MlMY{e^k-!!sBumwcDlBvBp=fAXd zRpp7Od`oSg&c^o{Oky35$N7W3mZU7^!|Hd&FR E=c^dIB^XA5(%cMN35G<2scgqWlaVnKEO~o zFV?bGMBdThxw7>>Gs4-la4oExd?!h_tnxQpvU>EME@uVgxh@XY_Z{a*(hofE-W)?vE|jc`7mt8BB18_z z|L6i=!Ln@GZA-jV3Q|{SaTn}tph>Zyl+9RT^tLGrWhfPNvrRg0IlA`kbZ@?!T-%)E zSG0f4H4hKD!QR}rTDi7|YSMTP2h^vab=t(@@pALu7(R6WDI$Bu3|2?i7`-ES;CkI| zgubY+Sjv~I>gi3cju>v)Z0Q;sM|ta8jvXeZuEcCOPqO?kdAdAD)!$o9Pr_~Gk0V;r zTeP>nE!|y>>zE6Pe(GRXqVP~udsD{xu9rtZ3ppU_x zhV$~*)zXOXC{d6dfY2OwzXA!UDvv5d|Tr zo<2kMoO7tqArVGa8Qx6>qKZwQ*dYiR?LhPreivqt3ox4#aF}jBQQl}W(xXKPXvn4! zAchw6AF42Q`E;MiCn4@B5v|c=*^1!#B3MO(F3PGQ;x;I$5W;K?96|x1>Lmb0S@yIb zBt$?uNFu6N;OiL^FAw=FRN}Ckqf2BrPvHWD2oND8?g{z+t&C~sH@a+6bzlevmBq7uxh#+E8L44sc-*v{ zqx&>?ue9WLovU>0SlaYsFEw`XC;an*X*b_V&#_I7wwD_A_O0oaJ&qH-Gr8!9Bg6(1 z`>W?(lW1VX-8-74-issMGG>DG>(!5is%4m8Ce~*MZkn4}}SBpUXh9>2d=znct?(zF+ zX-32{4hDri$o*yY(R>$?`RF>A-7-G3%au#a^>=U!yawyRu%4SXHRmcuk{usg{k# z(@dK!MlRJ&h~RNP+Im?!a5jvl(q%Mnhm`AcRe_U^m5BAHp#L~Bi`Jt_-aR`P;^e9L z(+L=2ccTix+`PW|4`Iry29){~?z*7&gFo|SJtG70*pKO>_S31}CA^rYvdW3QrgNN-orKF4(KFqgw>vK?3YFdC!0upq(Qo}Ct|ZUDl6XraI& zFbCCG(N@F**Av$S@dfLPU`>L=PGxy=Hj%3AnsIrwww#Yx_*KYi0~6yb8De5$ZL(UW z8Cb8jPELcVb6uw`YfQ*y1+c`*u?AwS4n_@9++=H{)l*EY8{{=BGGsD1%P=^yeL^Ov z7YwKeiR*O%>ZjXZQ96gk7J`4YaF0prZ4P7(0qw|;3cU+d?Zr7K*#ZwNhEd4-7A6*n zW}{R-n5UH5`(q&b>D)CqmX3d3L+(?&y+llLf$lHK?#|sNt$-ZW~O+wEZ$O3%J9Xi*cW`OD1nQF2TJuGlK;2)OlaeJ3B)pU6IVmb;?z(O|I13-yqh(xs1lru`;I=^_i1k=h*g+ zqiLblEMmBN_l_ynouf}QUQ8{Xn%E461tYO6gCE`vGV^1FCE#G%q(RXW-`kH!x+k};(X(ib62Fviu;z;PX71tPRC&38<&yZ zZ{F(;9all?NZyTf3{#Q2;(Pud3T+(GlHV%a=&w6fw90FUY8PS5UcEz9J{>Cdn$O=x z$+jlbOidE=Ri(5#9|E$f?Mvdiz(pbp;2nhRrH_!D=^T5J6Tk?I%#2l$ii~9zV=PlF zlQ6w0iv8mcHTX}r4CP;6k;4}Z6@T-wXl?d)+oS1HoiY#3oj43sG@C3wG~90&+e>i% zTPjYndh=yRGOZ-qiexXbC5P_Es($#`c(67`b(MR5CPU$pU91v(FY3lv$mtGLa#!xmqXgY?&$+O0SATMdipKC@QUc*AK}d>5hP(k9CIzjjUr;q}3K z%p*Rviz$-JA&jhsJtmsSWQJI3v4bjESvHr_@D2TDddE`Ouv&~ZqfwhF6!kk zkbP3YUm1z|*$3KQl#P2i&GOS1c@3@>lC~cfiH{3Dlp86;xrgV-C*N>mJXFcUb#O3Oyrxm(DZsq` z*Kg8d{%aHYQ~!B%7rK7OnIBsvTl>v>#@8^tM-$qY)mutVoeQbZm}Nf7I3UYRp@1Sa z9?1K2?*#c<`<&j_I6ZsN<_-iL$KJh%y?fE1_zK?Eq|tDeD&(c`rX=Q(!>#+)9VS0A z%xQlY^LRF%L%}@9Rd`Npe6E##UBl4D6BkKn*(UpBZN?KiX;xu&r)kW}Hnd-hvf7R2 zscO*EB-J-xqfp_BxEU*T#j7EfLusX}W)`hVGZOD2`A^qpUC-GND>ixe#?2zrEc7th*n6#QL1^?D2(-8J1h3^@V&7+$t#V~C)jg$Ea zgC{W850Y<3&Jy!z$EUb95EgmaR~guB&Pydx&5ACbA>;_#$)9dOQ2yd4#~c8S=V z7_zcx!KF7Q)Xd3ORudRWv8|-?WSXY+Wn$HZ%yJ(=iJ35EQM!I~&%9P9NszMqLn~CX zCIyqFKSea03-=0YO(wznG?z<8Ux_DA1tZ+%Me+`=L)?q{Qk{^yw;qE*`&*i}3`sPv zNgh^U!m?#i`xmm<+L$veg7FrrVd%7UR^gIxMU`#TjHAV9$&Cyc)fyU-{^HinqgB%s z*|wz08k!okn5;&HbsYAqdej@swBV01&XS#HjDHS>W}PGVvoVZM1E7COL+l@)W73Z` zN5Yfl=}cn-3}ox`jH?D*rZLSsd9{bMnFiUDDYNV;_0K9NUFno`D|Pr)3iyv^pcWS= zj#Wz`93c~cJ?O@y_9@Y{Tb>65e}a_B)CY{w7LHTi{ZDyux)B}99sfubQ|T$v_qe0< zpM;mzFt4d(n%1OQ8mn2Y8m45X7K=%vD=;RRlT9SV%vPbPH6@gtY?iWRlO{$OmeyG- zG#M*Y%~n$>jX-HRmfC(fes{pP8MyH?Bck*M##2WaYMC`O(q^WWkt-^ZNDBfHiZTP* z0b(;hSG6_3d*3;W5&H?Er{JIA)9y{D7xXXe zO>K4>Pt{)vybsXj`sn1=WIBwdOpKUUa`{?|`kXCvUtCBGVF%N8pw(Kf6nT(0DKO!l zN_xMsy0{Lv+Ya+$YPL)95vg#UgDWKY(^T+S`9FQ^2R7W6|l?%+}4DevR3i7TIdk1meWT%(1D0(m*f4R4|*NfGm_T z610;Q8VLclT{caZPIzw5(X?#E9VabIiKJ!>{-kqr7hXE2M^-!LvmEPVDWu-H;%2n- zi8oI9Su!lqJ4)=NZaO8}%rXykBRMj>kK0BmFN5dZhw9sKN;B`$-RlVH2)Y`e6XLQMm zWW|FrSjm=CC5ekEnN0`f+M7|j+*-0>ES-ZJrTd*KzgnFg)fts9pt(idL`M-o)(ROk z6RW>ZyVcq9w`CsjS9l&1YNncF5x6}ob0uM42>IEW20)P_MLW(hd{g10=OR6kPQoB{ z#cHSN;U}pn{0e=NbdR^CFYBjWQ{_K{85qh&lfQq2J&E&KSBOU`FD2)paZ&ws4>8d8 zy{yz?jH>yIAj&WA{Np;JpD}I>iIs^yl~yF?8V!>vwAz_bv}%0JKN(#srccLBQ;^c#*=I#z~T&Xmcx + %\VignetteIndexEntry{data_dictionary} + %\VignetteEngine{knitr::rmarkdown} + %\VignetteEncoding{UTF-8} +--- + +```{r, include = FALSE} +knitr::opts_chunk$set( + collapse = TRUE, + comment = "#>" +) +``` + +```{r setup} +library(workflow.multi.loanbook) +``` +# Intro + +In many cases, users of this package will want to use the outputs of the analyses for further processing, such as additional analyses or making visualizations based on the design guide of their own organisation. To facilitate such additional use cases, but also simplify interpretation of the outputs generated with this package, this data dictionary documents each type of output table in detail, focusing on data types and definitions. + +This article is structured based on the output tables generated by `workflow.multi.loanbook` and follows the standard flow of the user experience as much as possible, so it can be read in the same sequence as the analysis is run. + +# Tables + +The main steps that generate output tables are: + +* Diagnostics and coverage +* Standard PACTA analysis +* Aggregated PACTA metrics + +## Diagnostics + +The diagnostics section is split into determining the match success rate of the loan books analysed and inspecting the real economy activity related to the financing made by the banks through the matched loan books. The former is influenced by the quality of the input loan book data and the completeness of the reference production data against which the loan books are matched. The latter, while it depends on a solid match success rate, is mainly driven by the financing decisions and the portfolio allocation made by the banks. + +### Match success rate + +```{r dd_lbk_match_success_rate} +dd_lbk_match_success_rate <- dplyr::filter(data_dictionary, .data[["dataset"]] == "lbk_match_success_rate") +DT::datatable(dd_lbk_match_success_rate) + +``` + +### Loan book coverage + +```{r dd_summary_statistics_loanbook_coverage} +dd_summary_statistics_loanbook_coverage <- dplyr::filter(data_dictionary, .data[["dataset"]] == "summary_statistics_loanbook_coverage") +DT::datatable(dd_summary_statistics_loanbook_coverage) + +``` + +## Standard PACTA analysis + +The standard PACTA analysis is run across all input banking books, but produces the same output metrics as known from the `r2dii.*` packages. Results are given at portfolio level grouped by banking book. Beyond the standard output format, tables are provided that can be used as input for visualizations, for each of the standard sectors and technologies. + +### Target Market Share results (all groups) + +Target market share results at the portfolio level for each included banking book + +```{r dd_tms_results_all_groups} +dd_tms_results_all_groups <- dplyr::filter(data_dictionary, .data[["dataset"]] == "tms_results_all_groups") +DT::datatable(dd_tms_results_all_groups) + +``` + + +### Sectoral Decarbonization Approach results (all groups) + +SDA results at the portfolio level for each included banking book + +```{r dd_sda_results_all_groups} +dd_sda_results_all_groups <- dplyr::filter(data_dictionary, .data[["dataset"]] == "sda_results_all_groups") +DT::datatable(dd_sda_results_all_groups) + +``` + + +### Data tech mix + +Results for a given portfolio and sector, tailored to be used in the tech mix chart + +```{r dd_data_tech_mix} +dd_data_tech_mix <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_tech_mix") +DT::datatable(dd_data_tech_mix) + +``` + + +### Data trajectory + +Results for a given portfolio, sector and technology, tailored to be used in the volume trajectory chart + +```{r dd_data_trajectory} +dd_data_trajectory <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_trajectory") +DT::datatable(dd_data_trajectory) + +``` + + +### Data emission intensity + +Results for a given portfolio and sector, tailored to be used in the emission intensity chart + +```{r dd_data_emission_intensity} +dd_data_emission_intensity <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_trajectory") +DT::datatable(dd_data_emission_intensity) + +``` + + +### Companies included + +Lists all companies including exposures, that were analysed for the given loan book and that are therefore included in the data to be visualized. + +```{r dd_companies_included} +dd_companies_included <- dplyr::filter(data_dictionary, .data[["dataset"]] == "companies_included") +DT::datatable(dd_companies_included) + +``` + + +## Aggregated PACTA metrics + +dd_company_technology_deviation_tms, + dd_company_alignment_net_tms, + dd_company_alignment_bo_po_tms, + dd_company_alignment_net_sda, + dd_company_exposure_bo_po_aggregate_alignment, + dd_company_exposure_net_aggregate_alignment, + dd_loanbook_exposure_bo_po_aggregate_alignment, + dd_loanbook_exposure_net_aggregate_alignment, + dd_data_sankey, + dd_data_scatter_alignment_exposure, + dd_data_scatter_sector, + dd_data_scatter_sector_animated, + dd_data_timeline_net, + dd_data_timeline_bo_po From aa4ac225d1f04a72be043f3f9feb9b9dcf75ee31 Mon Sep 17 00:00:00 2001 From: jacobvjk Date: Tue, 3 Sep 2024 15:12:54 +0200 Subject: [PATCH 14/15] update sysdata.rda --- R/sysdata.rda | Bin 5433 -> 470 bytes 1 file changed, 0 insertions(+), 0 deletions(-) diff --git a/R/sysdata.rda b/R/sysdata.rda index 363def70a8e4ba87a4add3690836d8051c95c867..0f6a68795e7d26436c75db9b29a023008ed884d9 100644 GIT binary patch literal 470 zcmV;{0V)1MT4*^jL0KkKSx)F#GhY9+8=<45mbxH8Ob<2-DOUhMHj- zXvAazki=*Jl2I_4o}Qw5hCt8&8UPIqH1!PwX#jejUkN0Ho|hfPk`i!m|b(c53&6mPtg4@s8|3jG7#<#!Lw=!$V8MMAroR$<`%X0 zf=Wd1XrC~dtRMjhAchDA0f2d=WIo9PW&|Uep}UQ9%N# zD}jN|3<32E6p;s*a?APg%B>2;m#|ryxfCicq?{`0Y35^&84YNLw~Pf+)Jd8S$)L_~ zbq^%aFNB6aa&$YZ(7>i_@% literal 5433 zcmV-96~^j9T4*^jL0KkKSxfR^G5{ZwfB*mg|F7=<{MG;e|KR`s|MS6M5JCe$h9H85 z00aa85CPyKJ_pbhDnLj8palRV0x&H=000DnN&oS+B?Gz|bW0g;iKnE(cWVlgxYDIkD?6Cf$3m?2MUCec4s^*ki? zG#VNJ00Tf89;4L600y2?fv*=P=Mh7iv=v0|#1k22%O$4MQB#a~xksV_~DIyV(Bq9W4AuLcc5}tvfe4FL(Z0BzN|HrNF z=RSvzCvQB>zTf1RLw{YiFIO^VGf;O>wdggry8@i3Z3}7K$dpONysb%bX}b$z37N8M zYU`U#+4QNX84fLbs6i>Upqo>hK`@d*-LrW!4~N7q@m;}QGwqb=~SqVh=HNl!c|N%o8N82sNr>-hWt94 zX}EQ@p|zxD><-h-gk1#KY8Ap_I~qEc2C8A86+_E^8^^E^%CLBq^8<0jE4m8NVjc`q z!HlwpOHt`sdQV3#6MD#PyRx{O&z{`deRXTfaZ9XlnX_%D;!X{@o6^fVtj=tjnwuMr z9e7iR+g!7uyTRVo8Zn<}{3_e;3>&;RT$hAmcbHtQtJ1lKj)QrFfuTKV{F~hB##!yQ z-5jOHe!OKm(|GSX(&r^&SyO^>44RoHLF=dmkl<}-xOO;FE!N3r^t5lmD2BBip`0~M zpm)y=k0mK4DGdO`WNMYc*}U9+)aA9y;odU z**8(G@@ewb%W2xg;(AA2dk>#iDm+cchW6>9>rS)BM;j)~nW4Y?qk*(-4eQ<7I6Pk6 znwvD~V+Z|B>9b6=ab9P2-1xgD7kc6HwMf{tn_MlMY{e^k-!!sBumwcDlBvBp=fAXd zRpp7Od`oSg&c^o{Oky35$N7W3mZU7^!|Hd&FR E=c^dIB^XA5(%cMN35G<2scgqWlaVnKEO~o zFV?bGMBdThxw7>>Gs4-la4oExd?!h_tnxQpvU>EME@uVgxh@XY_Z{a*(hofE-W)?vE|jc`7mt8BB18_z z|L6i=!Ln@GZA-jV3Q|{SaTn}tph>Zyl+9RT^tLGrWhfPNvrRg0IlA`kbZ@?!T-%)E zSG0f4H4hKD!QR}rTDi7|YSMTP2h^vab=t(@@pALu7(R6WDI$Bu3|2?i7`-ES;CkI| zgubY+Sjv~I>gi3cju>v)Z0Q;sM|ta8jvXeZuEcCOPqO?kdAdAD)!$o9Pr_~Gk0V;r zTeP>nE!|y>>zE6Pe(GRXqVP~udsD{xu9rtZ3ppU_x zhV$~*)zXOXC{d6dfY2OwzXA!UDvv5d|Tr zo<2kMoO7tqArVGa8Qx6>qKZwQ*dYiR?LhPreivqt3ox4#aF}jBQQl}W(xXKPXvn4! zAchw6AF42Q`E;MiCn4@B5v|c=*^1!#B3MO(F3PGQ;x;I$5W;K?96|x1>Lmb0S@yIb zBt$?uNFu6N;OiL^FAw=FRN}Ckqf2BrPvHWD2oND8?g{z+t&C~sH@a+6bzlevmBq7uxh#+E8L44sc-*v{ zqx&>?ue9WLovU>0SlaYsFEw`XC;an*X*b_V&#_I7wwD_A_O0oaJ&qH-Gr8!9Bg6(1 z`>W?(lW1VX-8-74-issMGG>DG>(!5is%4m8Ce~*MZkn4}}SBpUXh9>2d=znct?(zF+ zX-32{4hDri$o*yY(R>$?`RF>A-7-G3%au#a^>=U!yawyRu%4SXHRmcuk{usg{k# z(@dK!MlRJ&h~RNP+Im?!a5jvl(q%Mnhm`AcRe_U^m5BAHp#L~Bi`Jt_-aR`P;^e9L z(+L=2ccTix+`PW|4`Iry29){~?z*7&gFo|SJtG70*pKO>_S31}CA^rYvdW3QrgNN-orKF4(KFqgw>vK?3YFdC!0upq(Qo}Ct|ZUDl6XraI& zFbCCG(N@F**Av$S@dfLPU`>L=PGxy=Hj%3AnsIrwww#Yx_*KYi0~6yb8De5$ZL(UW z8Cb8jPELcVb6uw`YfQ*y1+c`*u?AwS4n_@9++=H{)l*EY8{{=BGGsD1%P=^yeL^Ov z7YwKeiR*O%>ZjXZQ96gk7J`4YaF0prZ4P7(0qw|;3cU+d?Zr7K*#ZwNhEd4-7A6*n zW}{R-n5UH5`(q&b>D)CqmX3d3L+(?&y+llLf$lHK?#|sNt$-ZW~O+wEZ$O3%J9Xi*cW`OD1nQF2TJuGlK;2)OlaeJ3B)pU6IVmb;?z(O|I13-yqh(xs1lru`;I=^_i1k=h*g+ zqiLblEMmBN_l_ynouf}QUQ8{Xn%E461tYO6gCE`vGV^1FCE#G%q(RXW-`kH!x+k};(X(ib62Fviu;z;PX71tPRC&38<&yZ zZ{F(;9all?NZyTf3{#Q2;(Pud3T+(GlHV%a=&w6fw90FUY8PS5UcEz9J{>Cdn$O=x z$+jlbOidE=Ri(5#9|E$f?Mvdiz(pbp;2nhRrH_!D=^T5J6Tk?I%#2l$ii~9zV=PlF zlQ6w0iv8mcHTX}r4CP;6k;4}Z6@T-wXl?d)+oS1HoiY#3oj43sG@C3wG~90&+e>i% zTPjYndh=yRGOZ-qiexXbC5P_Es($#`c(67`b(MR5CPU$pU91v(FY3lv$mtGLa#!xmqXgY?&$+O0SATMdipKC@QUc*AK}d>5hP(k9CIzjjUr;q}3K z%p*Rviz$-JA&jhsJtmsSWQJI3v4bjESvHr_@D2TDddE`Ouv&~ZqfwhF6!kk zkbP3YUm1z|*$3KQl#P2i&GOS1c@3@>lC~cfiH{3Dlp86;xrgV-C*N>mJXFcUb#O3Oyrxm(DZsq` z*Kg8d{%aHYQ~!B%7rK7OnIBsvTl>v>#@8^tM-$qY)mutVoeQbZm}Nf7I3UYRp@1Sa z9?1K2?*#c<`<&j_I6ZsN<_-iL$KJh%y?fE1_zK?Eq|tDeD&(c`rX=Q(!>#+)9VS0A z%xQlY^LRF%L%}@9Rd`Npe6E##UBl4D6BkKn*(UpBZN?KiX;xu&r)kW}Hnd-hvf7R2 zscO*EB-J-xqfp_BxEU*T#j7EfLusX}W)`hVGZOD2`A^qpUC-GND>ixe#?2zrEc7th*n6#QL1^?D2(-8J1h3^@V&7+$t#V~C)jg$Ea zgC{W850Y<3&Jy!z$EUb95EgmaR~guB&Pydx&5ACbA>;_#$)9dOQ2yd4#~c8S=V z7_zcx!KF7Q)Xd3ORudRWv8|-?WSXY+Wn$HZ%yJ(=iJ35EQM!I~&%9P9NszMqLn~CX zCIyqFKSea03-=0YO(wznG?z<8Ux_DA1tZ+%Me+`=L)?q{Qk{^yw;qE*`&*i}3`sPv zNgh^U!m?#i`xmm<+L$veg7FrrVd%7UR^gIxMU`#TjHAV9$&Cyc)fyU-{^HinqgB%s z*|wz08k!okn5;&HbsYAqdej@swBV01&XS#HjDHS>W}PGVvoVZM1E7COL+l@)W73Z` zN5Yfl=}cn-3}ox`jH?D*rZLSsd9{bMnFiUDDYNV;_0K9NUFno`D|Pr)3iyv^pcWS= zj#Wz`93c~cJ?O@y_9@Y{Tb>65e}a_B)CY{w7LHTi{ZDyux)B}99sfubQ|T$v_qe0< zpM;mzFt4d(n%1OQ8mn2Y8m45X7K=%vD=;RRlT9SV%vPbPH6@gtY?iWRlO{$OmeyG- zG#M*Y%~n$>jX-HRmfC(fes{pP8MyH?Bck*M##2WaYMC`O(q^WWkt-^ZNDBfHiZTP* z0b(;hSG6_3d*3;W5&H?Er{JIA)9y{D7xXXe zO>K4>Pt{)vybsXj`sn1=WIBwdOpKUUa`{?|`kXCvUtCBGVF%N8pw(Kf6nT(0DKO!l zN_xMsy0{Lv+Ya+$YPL)95vg#UgDWKY(^T+S`9FQ^2R7W6|l?%+}4DevR3i7TIdk1meWT%(1D0(m*f4R4|*NfGm_T z610;Q8VLclT{caZPIzw5(X?#E9VabIiKJ!>{-kqr7hXE2M^-!LvmEPVDWu-H;%2n- zi8oI9Su!lqJ4)=NZaO8}%rXykBRMj>kK0BmFN5dZhw9sKN;B`$-RlVH2)Y`e6XLQMm zWW|FrSjm=CC5ekEnN0`f+M7|j+*-0>ES-ZJrTd*KzgnFg)fts9pt(idL`M-o)(ROk z6RW>ZyVcq9w`CsjS9l&1YNncF5x6}ob0uM42>IEW20)P_MLW(hd{g10=OR6kPQoB{ z#cHSN;U}pn{0e=NbdR^CFYBjWQ{_K{85qh&lfQq2J&E&KSBOU`FD2)paZ&ws4>8d8 zy{yz?jH>yIAj&WA{Np;JpD}I>iIs^yl~yF?8V!>vwAz_bv}%0JKN(#srccLBQ;^c#*=I#z~T&Xmcx Date: Wed, 4 Sep 2024 11:39:03 +0200 Subject: [PATCH 15/15] complete info in data_dictionary vignette --- vignettes/data_dictionary.Rmd | 156 +++++++++++++++++++++++++++++++--- 1 file changed, 142 insertions(+), 14 deletions(-) diff --git a/vignettes/data_dictionary.Rmd b/vignettes/data_dictionary.Rmd index 135a8ca9..d9a0bdda 100644 --- a/vignettes/data_dictionary.Rmd +++ b/vignettes/data_dictionary.Rmd @@ -123,17 +123,145 @@ DT::datatable(dd_companies_included) ## Aggregated PACTA metrics -dd_company_technology_deviation_tms, - dd_company_alignment_net_tms, - dd_company_alignment_bo_po_tms, - dd_company_alignment_net_sda, - dd_company_exposure_bo_po_aggregate_alignment, - dd_company_exposure_net_aggregate_alignment, - dd_loanbook_exposure_bo_po_aggregate_alignment, - dd_loanbook_exposure_net_aggregate_alignment, - dd_data_sankey, - dd_data_scatter_alignment_exposure, - dd_data_scatter_sector, - dd_data_scatter_sector_animated, - dd_data_timeline_net, - dd_data_timeline_bo_po +The aggregated PACTA metrics are also run across all input banking books. The calculations produce the net aggregate alignment metric, which is defined in `pacta.multi.loanbook.analysis` and allows producing the corresponding plots using `pacta.multi.loanbook.plot`. Results are grouped at the level defined by the `by_group` parameter. + +### Company technology deviation + +For each company in the analyzed banking books, shows the deviation of the technology build-out in the final year of the analysis from the corresponding allocated scenario value. This is an intermediate result that is further processed in the calculation of the net aggregate alignment metric. Only available for sectors, which have technology level calculations using the target market share, namely `automotive, coal, oil and gas, power`. + +```{r dd_company_technology_deviation_tms} +dd_company_technology_deviation_tms <- dplyr::filter(data_dictionary, .data[["dataset"]] == "company_technology_deviation_tms") +DT::datatable(dd_company_technology_deviation_tms) + +``` + +### Company net alignment metric for TMS sectors + +For each company in the analyzed banking books, shows the net aggregate alignment metric for sectors, which have technology level calculations using the target market share, namely `automotive, coal, oil and gas, power`. See the [`pacta.multi.loanbook.analysis` wensite](https://rmi-pacta.github.io/pacta.multi.loanbook.analysis/articles/company_alignment_metric.html) for methodological documentation. + +```{r dd_company_alignment_net_tms} +dd_company_alignment_net_tms <- dplyr::filter(data_dictionary, .data[["dataset"]] == "company_alignment_net_tms") +DT::datatable(dd_company_alignment_net_tms) + +``` + +### Disaggregated company buildout/phaseout alignment metric for TMS sectors + +For each company in the analyzed banking books, shows the aggregate alignment metric - disaggregated into its buildout and phaseout components - for sectors, which have technology level calculations using the target market share, namely `automotive, coal, oil and gas, power`. See the [`pacta.multi.loanbook.analysis` wensite](https://rmi-pacta.github.io/pacta.multi.loanbook.analysis/articles/company_alignment_metric.html) for methodological documentation. + +```{r dd_company_alignment_bo_po_tms} +dd_company_alignment_bo_po_tms <- dplyr::filter(data_dictionary, .data[["dataset"]] == "company_alignment_bo_po_tms") +DT::datatable(dd_company_alignment_bo_po_tms) + +``` + +### Company net alignment metric for SDA sectors + +For each company in the analyzed banking books, shows the net aggregate alignment metric for sectors, which have sector level calculations using the sectoral decarbonization approach (SDA), namely `aviation, cement, steel`. See the [`pacta.multi.loanbook.analysis` wensite](https://rmi-pacta.github.io/pacta.multi.loanbook.analysis/articles/company_alignment_metric.html) for methodological documentation. + +```{r dd_company_alignment_net_sda} +dd_company_alignment_net_sda <- dplyr::filter(data_dictionary, .data[["dataset"]] == "company_alignment_net_sda") +DT::datatable(dd_company_alignment_net_sda) + +``` + +### Company net aggregate alignment metric with financial exposures + +For each company in the analyzed banking books, shows the net aggregate alignment metric for all available sectors. This table includes the financial exposure to each of the analyzed parts of the banking books, split as defined in `by_group`. + +```{r dd_company_exposure_net_aggregate_alignment} +dd_company_exposure_net_aggregate_alignment <- dplyr::filter(data_dictionary, .data[["dataset"]] == "company_exposure_net_aggregate_alignment") +DT::datatable(dd_company_exposure_net_aggregate_alignment) + +``` + +### Disaggregated company buildout/phaseout alignment metric with financial exposures + +For each company in the analyzed banking books, shows the net aggregate alignment metric - disaggregated by its buildout and phaseout components - for all sectors that use technology level TMS calculations, namely `automotive, coal, oil and gas, power`. This table includes the financial exposure to each of the analyzed parts of the banking books, split as defined in `by_group`. Note that the financial exposure is not disaggregated, the alignment metric is. + +```{r dd_company_exposure_bo_po_aggregate_alignment} +dd_company_exposure_bo_po_aggregate_alignment <- dplyr::filter(data_dictionary, .data[["dataset"]] == "company_exposure_bo_po_aggregate_alignment") +DT::datatable(dd_company_exposure_bo_po_aggregate_alignment) + +``` + +### Loan book net aggregate alignment metric with financial exposures + +For each loan book level group (split as defined in `by_group`), shows the net aggregate alignment metric for all available sectors. This table includes the financial exposure to each of the analyzed parts of the banking books. Company level results are aggregated to the loan book level, using their relative financial exposure as weights. + +```{r dd_loanbook_exposure_net_aggregate_alignment} +dd_loanbook_exposure_net_aggregate_alignment <- dplyr::filter(data_dictionary, .data[["dataset"]] == "loanbook_exposure_net_aggregate_alignment") +DT::datatable(dd_loanbook_exposure_net_aggregate_alignment) + +``` + +### Disaggregated loan book buildout/phaseout alignment metric with financial exposures + +For each loan book level group (split as defined in `by_group`), shows the net aggregate alignment metric - disaggregated by its buildout and phaseout components - for all sectors using technology level TMS calculations, namely `automotive, coal, oil and gas, power`. Company level results are aggregated to the loan book level, using their relative financial exposure as weights. + +```{r dd_loanbook_exposure_bo_po_aggregate_alignment} +dd_loanbook_exposure_bo_po_aggregate_alignment <- dplyr::filter(data_dictionary, .data[["dataset"]] == "loanbook_exposure_bo_po_aggregate_alignment") +DT::datatable(dd_loanbook_exposure_bo_po_aggregate_alignment) + +``` + +### Input data for Sankey plot + +Data set meant to be used as input into `pacta.multi.loanbook.plot::plot_sankey()`. + +```{r dd_data_sankey} +dd_data_sankey <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_sankey") +DT::datatable(dd_data_sankey) + +``` + +### Input data for alignment-by-exposure scatter plot + +Data set meant to be used as input into `pacta.multi.loanbook.plot::plot_scatter_alignment_exposure()`. + +```{r dd_data_scatter_alignment_exposure} +dd_data_scatter_alignment_exposure <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_scatter_alignment_exposure") +DT::datatable(dd_data_scatter_alignment_exposure) + +``` + +### Input data for buildout/phaseout scatter plot + +Data set meant to be used as input into `pacta.multi.loanbook.plot::plot_scatter()`. + +```{r dd_data_scatter_sector} +dd_data_scatter_sector <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_scatter_sector") +DT::datatable(dd_data_scatter_sector) + +``` + +### Input data for animated buildout/phaseout scatter plot + +Data set meant to be used as input into `pacta.multi.loanbook.plot::plot_scatter_animated()`. + +```{r dd_data_scatter_sector_animated} +dd_data_scatter_sector_animated <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_scatter_sector_animated") +DT::datatable(dd_data_scatter_sector_animated) + +``` + +### Input data for net timline plot + +Data set meant to be used as input into `pacta.multi.loanbook.plot::plot_timeline()`. + +```{r dd_data_timeline_net} +dd_data_timeline_net <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_timeline_net") +DT::datatable(dd_data_timeline_net) + +``` + +### Input data for buildout/phaseout timline plot + +Data set meant to be used as input into `pacta.multi.loanbook.plot::plot_timeline()`. + +```{r dd_data_timeline_bo_po} +dd_data_timeline_bo_po <- dplyr::filter(data_dictionary, .data[["dataset"]] == "data_timeline_bo_po") +DT::datatable(dd_data_timeline_bo_po) + +``` +