-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.yml
188 lines (176 loc) · 14.8 KB
/
config.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
# Base configuration: declares every setting with a placeholder value.
# The named configurations below override these per data quarter / environment.
default:
  # --- Directories ----------------------------------------------------------
  # Each value is a single, absolute or relative path to a directory.

  # Directory where the outputs will be saved.
  data_prep_outputs_path: ""
  # Directory that contains the Asset Impact (AI) inputs (can be the same as
  # `factset_data_path` and/or `scenarios_data_path`).
  asset_impact_data_path: ""
  # Directory that contains the FactSet inputs (can be the same as
  # `asset_impact_data_path` and/or `scenarios_data_path`).
  factset_data_path: ""
  # Directory that contains the scenario inputs (can be the same as
  # `asset_impact_data_path` and/or `factset_data_path`).
  scenarios_data_path: ""
  # Directory that contains a previous "currencies.rds" file and/or will be
  # used to save a copy of pre-flight data files generated on-the-fly.
  # When left at the default (""), this is set to the same path as
  # `data_prep_outputs_path`.
  preflight_data_path: ""

  # --- Asset Impact input files ---------------------------------------------
  # Each value is a single filename of a CSV that must exist in the
  # `asset_impact_data_path` directory.

  # The intended masterdata_ownership CSV.
  masterdata_ownership_filename: ""
  # The intended masterdata_debt CSV.
  masterdata_debt_filename: ""
  # The intended ar_company_id__factset_entity_id CSV.
  ar_company_id__factset_entity_id_filename: ""

  # --- FactSet input files --------------------------------------------------
  # Each value is a single filename of an RDS that must exist in the
  # `factset_data_path` directory.

  # The intended factset_financial_data RDS.
  factset_financial_data_filename: ""
  # The intended factset_entity_info RDS.
  factset_entity_info_filename: ""
  # The intended factset_entity_financing_data RDS.
  factset_entity_financing_data_filename: ""
  # The intended factset_fund_data RDS.
  factset_fund_data_filename: ""
  # The intended factset_isin_to_fund_table RDS.
  factset_isin_to_fund_table_filename: ""
  # The intended factset_iss_emissions_data RDS.
  factset_iss_emissions_data_filename: ""
  # The intended factset_issue_code_bridge RDS.
  factset_issue_code_bridge_filename: ""
  # The intended factset_industry_map_bridge RDS.
  factset_industry_map_bridge_filename: ""
  # The intended factset_manual_pacta_sector_override RDS.
  factset_manual_pacta_sector_override_filename: ""

  # --- Switches -------------------------------------------------------------
  # Each value is a single `TRUE` or `FALSE`.

  # Whether currency data should be pulled on-the-fly (`TRUE`) or a previously
  # pulled version should be used (`FALSE`).
  update_currencies: TRUE
  # Whether sqlite versions of some output files should be included in the
  # outputs.
  export_sqlite_files: TRUE
  # Whether zip archives of the input files and output files should be
  # exported.
  export_archives: FALSE

  # --- Timestamps and horizons ----------------------------------------------

  # A single string specifying the IMF quarter timestamp (for pulling of
  # currency data) in the form "YYYY-QX", e.g. "2021-Q4".
  imf_quarter_timestamp: ""
  # A single string specifying the PACTA quarter timestamp in the form
  # "YYYYQX", e.g. "2021Q4".
  pacta_financial_timestamp: ""
  # A single integer specifying the market share target reference year in the
  # form YYYY, e.g. 2021.
  market_share_target_reference_year: 0
  # A single integer specifying the time horizon (number of forward looking
  # years) in years in the form N, e.g. 5.
  time_horizon: 5

  # --- Scenario, sector and technology selections ---------------------------
  # Each value is an array of strings.

  # Scenario sources to be included, e.g. ["ETP2020", "GECO2021"].
  scenario_sources_list: []
  # Primary PACTA sectors to be included, e.g. ["Automotive", "Power"].
  sector_list: []
  # Additional PACTA sectors to be included, e.g. ["Steel", "Aviation"].
  other_sector_list: []
  # Technologies to be considered as zero emission,
  # e.g. ["Electric", "HydroCap"].
  zero_emission_factor_techs: []
  # Technologies to be considered "green", e.g. ["FuelCell", "Hybrid"].
  green_techs: []
  # Raw scenario data from pacta.scenario.preparation to be included,
  # e.g. ["etp_2020", "geco_2021"].
  scenario_raw_data_to_include: []
  # Technologies to be excluded, e.g. ["OtherCap", "OtherFF"].
  tech_exclude: []
  # Scenario geographies to be included, e.g. ["Global", "NonOECD"].
  scenario_geographies_list: []
  # Scenarios to be used in the global aggregates,
  # e.g. ["ETP2020", "GECO2021"].
  global_aggregate_scenario_sources_list: []
  # Sectors to be included in the global aggregates, e.g. ["Power"].
  global_aggregate_sector_list: []
# Desktop runs: starts from the 2023Q4 settings and points the four data
# directories at `~`-prefixed local paths.
desktop:
  inherits: "2023Q4"

  data_prep_outputs_path: "~/data/pactadatadev/workflow-data-preparation-outputs"
  asset_impact_data_path: "~/data/pactarawdata/asset-impact/2024-02-15_AI_RMI_2023Q4"
  factset_data_path: "~/data/pactarawdata/factset-extracted/factset-pacta_timestamp-20231231T000000Z_pulled-20240524T132816Z"
  scenarios_data_path: "~/data/pactadatadev/workflow-scenario-preparation-outputs/2023Q4_20240701_T105302Z"
# Docker runs: each data directory is a fixed location under /mnt.
# The quarter configurations (2021Q4, 2022Q2, 2022Q4, 2023Q4) inherit from this.
docker:
  data_prep_outputs_path: "/mnt/outputs"
  asset_impact_data_path: "/mnt/asset-impact"
  factset_data_path: "/mnt/factset-extracted"
  scenarios_data_path: "/mnt/workflow-scenario-preparation-outputs"
# Settings for the 2021Q4 data quarter (directories come from `docker`).
2021Q4:
  inherits: "docker"

  # Asset Impact input files.
  masterdata_ownership_filename: "2023-06-05_AI_RMI Bespoke_Company Data Products_masterdata_ownership_2021q4.csv"
  masterdata_debt_filename: "2023-06-05_AI_RMI Bespoke_Company Data Products_masterdata_debt_2021q4.csv"
  ar_company_id__factset_entity_id_filename: "2022-08-17_rmi_ar_fs_id_bridge_2021q4.csv"

  # FactSet input files: all left as empty strings for this quarter.
  factset_financial_data_filename: ""
  factset_entity_info_filename: ""
  factset_entity_financing_data_filename: ""
  factset_fund_data_filename: ""
  factset_isin_to_fund_table_filename: ""
  factset_iss_emissions_data_filename: ""
  factset_issue_code_bridge_filename: ""
  factset_industry_map_bridge_filename: ""
  factset_manual_pacta_sector_override_filename: ""

  # Timestamps and horizons.
  imf_quarter_timestamp: "2021-Q4"
  pacta_financial_timestamp: "2021Q4"
  market_share_target_reference_year: 2021
  time_horizon: 5

  # Scenario, sector and technology selections.
  scenario_sources_list:
    - "ETP2020"
    - "GECO2021"
    - "IPR2021"
    - "ISF2021"
    - "WEO2021"
  sector_list:
    - "Automotive"
    - "Power"
    - "Fossil Fuels"
    - "Oil&Gas"
    - "Coal"
  other_sector_list:
    - "Steel"
    - "Aviation"
    - "Cement"
  zero_emission_factor_techs:
    - "Electric"
    - "HydroCap"
    - "NuclearCap"
    - "RenewablesCap"
  green_techs:
    - "FuelCell"
    - "Electric"
    - "Hybrid"
    - "RenewablesCap"
    - "HydroCap"
    - "NuclearCap"
    - "FuelCell_HDV"
    - "Electric_HDV"
    - "Hybrid_HDV"
  scenario_raw_data_to_include:
    - "etp_2020"
    - "geco_2021"
    - "ipr_2021"
    - "isf_2021"
    - "weo_2021"
  tech_exclude:
    - "OtherCap"
    - "OtherFF"
    - "Coking Plant"
    - "Sintering Plant"
    - "Direct Or Smelting Reduction Plant"
    - "Pelletizing Plant"
    - "Grinding Plant"
    - "Passenger / Freight"
  scenario_geographies_list:
    - "Global"
    - "NonOECD"
    - "OECD"
  global_aggregate_scenario_sources_list:
    - "ETP2020"
    - "GECO2021"
    - "IPR2021"
    - "ISF2021"
    - "WEO2021"
  global_aggregate_sector_list:
    - "Power"
# Settings for the 2022Q2 data quarter (directories come from `docker`).
2022Q2:
  inherits: "docker"

  # Asset Impact input files.
  masterdata_ownership_filename: "2022-08-30_rmi_masterdata_ownership_2022q2.csv"
  masterdata_debt_filename: "2022-10-03_rmi_masterdata_debt_2022q2.csv"
  # NOTE(review): this bridge filename carries a "2021q4" suffix and is the
  # same one the 2021Q4 configuration uses; confirm that is intended here.
  ar_company_id__factset_entity_id_filename: "2022-08-17_rmi_ar_fs_id_bridge_2021q4.csv"

  # FactSet input files: all left as empty strings for this quarter.
  factset_financial_data_filename: ""
  factset_entity_info_filename: ""
  factset_entity_financing_data_filename: ""
  factset_fund_data_filename: ""
  factset_isin_to_fund_table_filename: ""
  factset_iss_emissions_data_filename: ""
  factset_issue_code_bridge_filename: ""
  factset_industry_map_bridge_filename: ""
  factset_manual_pacta_sector_override_filename: ""

  # Timestamps and horizons.
  imf_quarter_timestamp: "2022-Q2"
  pacta_financial_timestamp: "2022Q2"
  market_share_target_reference_year: 2022
  time_horizon: 5

  # Scenario, sector and technology selections.
  scenario_sources_list:
    - "ETP2020"
    - "GECO2021"
    - "IPR2021"
    - "ISF2021"
    - "WEO2021"
  sector_list:
    - "Automotive"
    - "Power"
    - "Fossil Fuels"
    - "Oil&Gas"
    - "Coal"
  other_sector_list:
    - "Steel"
    - "Aviation"
    - "Cement"
  zero_emission_factor_techs:
    - "Electric"
    - "HydroCap"
    - "NuclearCap"
    - "RenewablesCap"
  green_techs:
    - "FuelCell"
    - "Electric"
    - "Hybrid"
    - "RenewablesCap"
    - "HydroCap"
    - "NuclearCap"
    - "FuelCell_HDV"
    - "Electric_HDV"
    - "Hybrid_HDV"
  scenario_raw_data_to_include:
    - "etp_2020"
    - "geco_2021"
    - "ipr_2021"
    - "isf_2021"
    - "weo_2021"
  tech_exclude:
    - "OtherCap"
    - "OtherFF"
    - "Coking Plant"
    - "Sintering Plant"
    - "Direct Or Smelting Reduction Plant"
    - "Pelletizing Plant"
    - "Grinding Plant"
    - "Passenger / Freight"
  scenario_geographies_list:
    - "Global"
    - "NonOECD"
    - "OECD"
  global_aggregate_scenario_sources_list:
    - "ETP2020"
    - "GECO2021"
    - "IPR2021"
    - "ISF2021"
    - "WEO2021"
  global_aggregate_sector_list:
    - "Power"
# Settings for the 2022Q4 data quarter (directories come from `docker`).
2022Q4:
  inherits: "docker"

  # Asset Impact input files.
  masterdata_ownership_filename: "2023-06-18_AI_RMI Bespoke_Company Data Products_masterdata_ownership_2022Q4.csv"
  masterdata_debt_filename: "2023-06-18_AI_RMI Bespoke_Company Data Products_masterdata_debt_2022Q4.csv"
  ar_company_id__factset_entity_id_filename: "2023-02-15_AI_RMI_Bespoke_Company_Data_Products_Company_ID_List_2022Q4.csv"

  # FactSet input files (timestamp 20221231T000000Z, pulled 20240217T134528Z).
  factset_financial_data_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_financial_data.rds"
  factset_entity_info_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_entity_info.rds"
  factset_entity_financing_data_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_entity_financing_data.rds"
  factset_fund_data_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_fund_data.rds"
  factset_isin_to_fund_table_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_isin_to_fund_table.rds"
  factset_iss_emissions_data_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_iss_emissions.rds"
  factset_issue_code_bridge_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_issue_code_bridge.rds"
  factset_industry_map_bridge_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_industry_map_bridge.rds"
  factset_manual_pacta_sector_override_filename: "timestamp-20221231T000000Z_pulled-20240217T134528Z_factset_manual_sector_override.rds"

  # Timestamps and horizons.
  imf_quarter_timestamp: "2022-Q4"
  pacta_financial_timestamp: "2022Q4"
  market_share_target_reference_year: 2022
  time_horizon: 5

  # Scenario, sector and technology selections.
  scenario_sources_list:
    - "GECO2022"
    - "ISF2021"
    - "WEO2022"
  sector_list:
    - "Automotive"
    - "Power"
    - "Oil&Gas"
    - "Coal"
  other_sector_list:
    - "Steel"
    - "Aviation"
    - "Cement"
  zero_emission_factor_techs:
    - "Electric"
    - "HydroCap"
    - "NuclearCap"
    - "RenewablesCap"
  green_techs:
    - "FuelCell"
    - "Electric"
    - "Hybrid"
    - "RenewablesCap"
    - "HydroCap"
    - "NuclearCap"
    - "FuelCell_HDV"
    - "Electric_HDV"
    - "Hybrid_HDV"
  scenario_raw_data_to_include:
    - "geco_2022"
    - "isf_2021"
    - "weo_2022"
  tech_exclude:
    - "OtherCap"
    - "OtherFF"
    - "Coking Plant"
    - "Sintering Plant"
    - "Direct Or Smelting Reduction Plant"
    - "Pelletizing Plant"
    - "Grinding Plant"
    - "Passenger / Freight"
  scenario_geographies_list:
    - "Global"
    - "NonOECD"
    - "OECD"
  global_aggregate_scenario_sources_list:
    - "WEO2022"
  global_aggregate_sector_list:
    - "Power"
# Azure variant of 2022Q4: turns on archive export, sets the data directories,
# and overrides the three Asset Impact filenames.
2022Q4_azure:
  inherits: "2022Q4"

  export_archives: TRUE

  # Data directories.
  data_prep_outputs_path: "/mnt/outputs"
  asset_impact_data_path: "/mnt/asset-impact"
  factset_data_path: "/mnt/factset-extracted/factset-pacta_timestamp-20221231T000000Z_pulled-20240217T134528Z"
  scenarios_data_path: "/mnt/workflow-scenario-preparation-outputs/2022Q4_20240418_T131922Z"

  # Asset impact files are stored in separate subdirectories on Azure File
  # Share, so each filename below carries its subdirectory as a prefix.
  masterdata_ownership_filename: "2023-06-18/2023-06-18_AI_RMI Bespoke_Company Data Products_masterdata_ownership_2022Q4.csv"
  masterdata_debt_filename: "2023-06-18/2023-06-18_AI_RMI Bespoke_Company Data Products_masterdata_debt_2022Q4.csv"
  ar_company_id__factset_entity_id_filename: "2023-02-15/2023-02-15_AI_RMI_Bespoke_Company_Data_Products_Company_ID_List_2022Q4.csv"
# Settings for the 2023Q4 data quarter (directories come from `docker`).
2023Q4:
  inherits: "docker"

  # Asset Impact input files.
  masterdata_ownership_filename: "2024-02-14_AI_RMI Bespoke_Company Data Products_masterdata_ownership_2023Q4.csv"
  masterdata_debt_filename: "2024-02-14_AI_RMI Bespoke_Company Data Products_masterdata_debt_2023Q4.csv"
  ar_company_id__factset_entity_id_filename: "2024-02-14_AI_RMI_Bespoke_Company_Data_Products_Company_ID_List_2023Q4.csv"

  # FactSet input files (timestamp 20231231T000000Z, pulled 20240524T132816Z).
  factset_financial_data_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_financial_data.rds"
  factset_entity_info_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_entity_info.rds"
  factset_entity_financing_data_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_entity_financing_data.rds"
  factset_fund_data_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_fund_data.rds"
  factset_isin_to_fund_table_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_isin_to_fund_table.rds"
  factset_iss_emissions_data_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_iss_emissions.rds"
  factset_issue_code_bridge_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_issue_code_bridge.rds"
  factset_industry_map_bridge_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_industry_map_bridge.rds"
  factset_manual_pacta_sector_override_filename: "timestamp-20231231T000000Z_pulled-20240524T132816Z_factset_manual_sector_override.rds"

  # Timestamps and horizons.
  imf_quarter_timestamp: "2023-Q4"
  pacta_financial_timestamp: "2023Q4"
  market_share_target_reference_year: 2023
  time_horizon: 5

  # Scenario, sector and technology selections.
  scenario_sources_list:
    - "GECO2023"
    - "ISF2023"
    - "WEO2023"
  sector_list:
    - "Automotive"
    - "Power"
    - "Oil&Gas"
    - "Coal"
  other_sector_list:
    - "Steel"
    - "Aviation"
    - "Cement"
  zero_emission_factor_techs:
    - "Electric"
    - "HydroCap"
    - "NuclearCap"
    - "RenewablesCap"
  green_techs:
    - "FuelCell"
    - "Electric"
    - "Hybrid"
    - "RenewablesCap"
    - "HydroCap"
    - "NuclearCap"
    - "FuelCell_HDV"
    - "Electric_HDV"
    - "Hybrid_HDV"
  scenario_raw_data_to_include:
    - "geco_2023"
    - "isf_2023"
    - "weo_2023"
  tech_exclude:
    - "OtherCap"
    - "OtherFF"
    - "Coking Plant"
    - "Sintering Plant"
    - "Direct Or Smelting Reduction Plant"
    - "Pelletizing Plant"
    - "Grinding Plant"
    - "Passenger / Freight"
  scenario_geographies_list:
    - "Global"
    - "NonOECD"
    - "OECD"
  global_aggregate_scenario_sources_list:
    - "WEO2023"
  global_aggregate_sector_list:
    - "Power"
# Azure variant of 2023Q4: turns on archive export and sets the data
# directories; everything else comes from 2023Q4.
2023Q4_azure:
  inherits: "2023Q4"

  export_archives: TRUE

  # Data directories.
  data_prep_outputs_path: "/mnt/outputs"
  asset_impact_data_path: "/mnt/asset-impact/2024-02-15_AI_RMI_2023Q4"
  factset_data_path: "/mnt/factset-extracted/factset-pacta_timestamp-20231231T000000Z_pulled-20240524T132816Z"
  scenarios_data_path: "/mnt/workflow-scenario-preparation-outputs/2023Q4_20240701_T105302Z"