calliope-project · brynpickering · Jul 9, 2024 · Apr 10, 2024 · Apr 10, 2024 · Apr 11, 2024
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -4,7 +4,7 @@
 
 ### Added (models)
 
-* **ADD** industry module and steel industry energy demand processing. NOT CONNECTED TO THE MAIN WORKFLOW. Industry sectors pending: chemical, "other". (Fixes #308, #310, #347, #345 and #346)
+* **ADD** industry module and steel industry energy demand processing. NOT CONNECTED TO THE MAIN WORKFLOW. Industry sectors pending: chemical. (Fixes #308, #309, #310, #347, #345 and #346)
 
 * **ADD** Spatial resolution that aligns with the regions defined by the [e-Highway 2050 project](https://cordis.europa.eu/project/id/308908/reporting) (`ehighways`) (#370).
 

diff --git a/modules/industry/config.yaml b/modules/industry/config.yaml
@@ -9,5 +9,10 @@ industry:
         placeholder-out1:
         placeholder-out2:
     params:
-        steel:
+        non-generic-categories: ["Iron and steel", "Chemicals Industry"]
+        steel-config:
             recycled-steel-share: 0.5  # Share (0-1) of recycled scrap steel for H-DRI
+        generic-config:
+            final-energy-method: "by priority"
+            final-energy-carriers: ["Electricity", "Natural gas (incl. biogas)", "Diesel oil (incl. biofuels)"]
+            useful-demands: ["Low enthalpy heat"]
diff --git a/modules/industry/industry.smk b/modules/industry/industry.smk
@@ -13,36 +13,46 @@ validate(config, "./schema.yaml")
 
 # Ensure rules are defined in order.
 # Otherwise commands like "rules.rulename.output" won't work!
-rule steel_industry:
-    message: "Calculate energy demand for the 'Iron and steel' sector in JRC-IDEES."
+# Define the steel rule only when "Iron and steel" is configured for separate (non-generic) processing.
+# NOTE(review): if the category is not listed, `rules.steel_processing` does not exist;
+# confirm that no other rule references it unconditionally.
+if "Iron and steel" in config["params"]["non-generic-categories"]:
+    rule steel_processing:
+        message: "Calculate energy demand for the 'Iron and steel' sector in JRC-IDEES."
+        conda: CONDA_PATH
+        params:
+            steel_config = config["params"]["steel-config"]
+        input:
+            path_energy_balances = config["inputs"]["path-energy-balances"],
+            path_cat_names = config["inputs"]["path-cat-names"],
+            path_carrier_names = config["inputs"]["path-carrier-names"],
+            path_jrc_industry_energy = config["inputs"]["path-jrc-industry-energy"],
+            path_jrc_industry_production = config["inputs"]["path-jrc-industry-production"],
+        output:
+            path_output = f"{BUILD_PATH}/annual_demand_steel.nc"
+        script: f"{SCRIPT_PATH}/steel_processing.py"
+
+# Define the chemicals rule only when "Chemicals Industry" is configured for separate processing.
+# NOTE(review): placeholder rule; message, params, input and output are not filled in yet.
+if "Chemicals Industry" in config["params"]["non-generic-categories"]:
+    rule chemicals_processing:
+        message: "."
+        conda: CONDA_PATH
+        params:
+        input:
+        output:
+        script: f"{SCRIPT_PATH}/chemicals_processing.py"
+
+# Always defined: receives the list of separately processed categories so the script can exclude them.
+rule generic_processing:
+    message: "Calculate energy demand for all other industry sectors in JRC-IDEES."
     conda: CONDA_PATH
     params:
-        config_steel = config["params"]["steel"]
+        non_generic_categories = config["params"]["non-generic-categories"],
+        generic_config = config["params"]["generic-config"],
     input:
         path_energy_balances = config["inputs"]["path-energy-balances"],
         path_cat_names = config["inputs"]["path-cat-names"],
         path_carrier_names = config["inputs"]["path-carrier-names"],
         path_jrc_industry_energy = config["inputs"]["path-jrc-industry-energy"],
         path_jrc_industry_production = config["inputs"]["path-jrc-industry-production"],
     output:
-        path_output = f"{BUILD_PATH}/annual_demand_steel.nc"
-    script: f"{SCRIPT_PATH}/steel_industry.py"
-
-rule chemical_industry:
-    message: "."
-    conda: CONDA_PATH
-    params:
-    input:
-    output:
-    script: f"{SCRIPT_PATH}/chemicals.py"
-
-rule other_industry:
-    message: "."
-    conda: CONDA_PATH
-    params:
-    input:
-    output: f"{BUILD_PATH}/other_industry.csv"
-    script: f"{SCRIPT_PATH}/other_industry.py"
+        path_output = f"{BUILD_PATH}/annual_demand_generic.nc"
+    script: f"{SCRIPT_PATH}/generic_processing.py"
 
 # rule combine_and_scale:
 #     message: "."

diff --git a/modules/industry/schema.yaml b/modules/industry/schema.yaml
@@ -38,7 +38,14 @@ properties:
         additionalProperties: false
         description: Parameters allow users to configure module behaviour.
         properties:
-            steel:
+            non-generic-categories:
+                type: array
+                description: "Specifies which JRC industry categories will be processed separately."
+                uniqueItems: true
+                items:
+                    type: string
+                    enum: ["Iron and steel", "Chemicals Industry"]
+            steel-config:
                 type: object
                 additionalProperties: false
                 description: "Parameters specific to the 'Iron and steel' industry category."
@@ -48,3 +55,30 @@ properties:
                         description: "Share of recycled metal in the H-DRI steel process."
                         minimum: 0
                         maximum: 1
+            generic-config:
+                type: object
+                additionalProperties: false
+                description: "Parameters for default/generic category processing."
+                properties:
+                    final-energy-method:
+                        description: |
+                            Processing method for final-demand.
+                            - "by priority": will take the carriers specified in "final-energy-carriers" in order of importance (first subtracts from second, etc.).
+                            - "keep everything": will keep all the final carrier demands with no assumptions.
+                        type: string
+                        enum: ["by priority", "keep everything"]
+                    final-energy-carriers:
+                        type: array
+                        description: "Final energy carriers to take, if relevant."
+                        uniqueItems: true
+                        items:
+                            type: string
+                    useful-demands:
+                        type: array
+                        description: |
+                            Demands to select from 'useful' rather than 'final' energy consumption data.
+                            Accepts any pre-processed JRC IDEES 'subsection' names.
+                            Always subtracted from 'final' energy demand to avoid double-counting.
+                        uniqueItems: true
+                        items:
+                            type: string
diff --git a/...les/industry/scripts/chemical_industry.py → .../industry/scripts/chemicals_processing.py b/...les/industry/scripts/chemical_industry.py → .../industry/scripts/chemicals_processing.py
diff --git a/modules/industry/scripts/generic_processing.py b/modules/industry/scripts/generic_processing.py
@@ -0,0 +1,142 @@
+from typing import Optional
+
+import pandas as pd
+import xarray as xr
+from utils import filling
+from utils import jrc_idees_parser as jrc
+
+
+def get_generic_demand(
+    non_generic_categories: list,
+    generic_config: dict,
+    path_energy_balances: str,
+    path_cat_names: str,
+    path_carrier_names: str,
+    path_jrc_industry_energy: str,
+    path_jrc_industry_production: str,
+    path_output: Optional[str] = None,
+) -> xr.DataArray:
+    """Processing of industry categories not selected for individual processing.
+
+    Merges all energy demand into a single `generic` category using a configurable data processing pipeline.
+
+    Args:
+        non_generic_categories (list): categories with separate processing (will be ignored).
+        generic_config (dict): configuration for generic category processing.
+        path_energy_balances (str): country energy balances (usually from eurostat).
+        path_cat_names (str): eurostat category mapping file.
+        path_carrier_names (str): eurostat carrier name mapping file.
+        path_jrc_industry_energy (str): jrc country-specific industrial energy demand file.
+        path_jrc_industry_production (str): jrc country-specific industrial production file.
+        path_output (str): location of steel demand output file.
+
+    Returns:
+        pd.DataFrame: dataframe with industrial demand per country.
+    """
+    # Load data
+    energy_balances_df = pd.read_csv(
+        path_energy_balances, index_col=[0, 1, 2, 3, 4]
+    ).squeeze("columns")
+    cat_names_df = pd.read_csv(path_cat_names, header=0, index_col=0)
+    carrier_names_df = pd.read_csv(path_carrier_names, header=0, index_col=0)
+    jrc_energy = xr.open_dataset(path_jrc_industry_energy)
+    jrc_prod = xr.open_dataarray(path_jrc_industry_production)
+
+    # Remove data from all specifically processed industries
+    cat_names_df = cat_names_df[~cat_names_df["jrc_idees"].isin(non_generic_categories)]
+    jrc_energy = jrc_energy.drop_sel(cat_name=non_generic_categories)
+    jrc_prod = jrc_prod.drop_sel(cat_name=non_generic_categories)
+
+    # Process data:
+    # Extract useful dem. -> remove useful dem. from rest -> extract final dem.
+    selected_useful = generic_config["useful-demands"]
+    other_useful_demand = jrc.convert_subsection_demand_to_carrier(
+        jrc_energy, selected_useful
+    )
+
+    final_method = generic_config["final-energy-method"]
+    jrc_energy = jrc_energy.drop_sel(subsection=selected_useful)
+
+    match final_method:
+        case "by priority":
+            other_final_demand = transform_final_demand_by_priority(
+                jrc_energy, generic_config["final-energy-carriers"]
+            )
+        case "keep everything":
+            other_final_demand = jrc_energy["final"].sum(["section", "subsection"])
+            other_final_demand = jrc.standardize(other_final_demand, "twh")
+        case _:
+            raise ValueError(f"Unsupported final energy method: {final_method}.")
+
+    # Combine and fill missing countries
+    other_demand = xr.concat(
+        [other_useful_demand, other_final_demand], dim="carrier_name"
+    )
+
+    other_demand = filling.fill_missing_countries_years(
+        energy_balances_df, cat_names_df, carrier_names_df, other_demand
+    )
+
+    other_demand = jrc.standardize(other_demand, "twh")
+
+    if path_output:
+        other_demand.to_netcdf(path_output)
+
+    return other_demand
+
+
+def transform_final_demand_by_priority(
+    jrc_energy: xr.Dataset, carrier_priority: list[str]
+) -> xr.DataArray:
+    """Transform final demand of generic categories by giving priority to certain carriers.
+
+    Steps:
+    1. Assume that all demand that could consume a carrier will be met by said carrier.
+    2. Drop overlapping consumption so that demand is met by carriers with the given priority.
+    3. Combine.
+
+    E.g., if carrier priority is [Electricity, Natural gas, Diesel] then:
+    - Electricity: if met exclusively or otherwise, it's final electrical demand.
+    - Natural gas: if met exclusively or otherwise, EXCEPT for overlapping cases with Electricity.
+    - Diesel: if met exclusively or otherwise, EXCEPT for overlapping cases with all the above.
+
+    Args:
+        jrc_energy (xr.Dataset): JRC energy dataset.
+        carrier_priority (list[str]): carriers to take in order of priority.
+
+    Returns:
+        xr.DataArray: dataset filled with demands for the given carriers.
+    """
+    carrier_final_dem = {}
+
+    for carrier in carrier_priority:
+        dem_replaced = jrc.replace_final_demand_by_carrier(carrier, jrc_energy)
+        dem_replaced = dem_replaced.to_dataframe().dropna()
+        for dem_replaced_prev in carrier_final_dem.values():
+            dem_replaced = dem_replaced.drop(dem_replaced_prev.index, errors="ignore")
+        carrier_final_dem[carrier] = dem_replaced
+
+    for carrier, df in carrier_final_dem.items():
+        carrier_final_dem[carrier] = (
+            df["final"].to_xarray().assign_coords(carrier_name=carrier)
+        )
+
+    final_dem = xr.concat(carrier_final_dem.values(), dim="carrier_name")
+    final_dem = final_dem.sum(["section", "subsection"])
+
+    final_dem = jrc.standardize(final_dem, "twh")
+
+    return final_dem
+
+
+if __name__ == "__main__":
+    get_generic_demand(
+        non_generic_categories=snakemake.params.non_generic_categories,
+        generic_config=snakemake.params.generic_config,
+        path_energy_balances=snakemake.input.path_energy_balances,
+        path_cat_names=snakemake.input.path_cat_names,
+        path_carrier_names=snakemake.input.path_carrier_names,
+        path_jrc_industry_energy=snakemake.input.path_jrc_industry_energy,
+        path_jrc_industry_production=snakemake.input.path_jrc_industry_production,
+        path_output=snakemake.output.path_output,
+    )
diff --git a/modules/industry/scripts/other_industry.py b/modules/industry/scripts/other_industry.py
diff --git a/modules/industry/scripts/steel_industry.py → modules/industry/scripts/steel_processing.py b/modules/industry/scripts/steel_industry.py → modules/industry/scripts/steel_processing.py
@@ -18,7 +18,7 @@ def _get_h2_to_steel(recycled_steel_share: float) -> float:
 
 
 def get_steel_demand_df(
-    config_steel: dict,
+    steel_config: dict,
     path_energy_balances: str,
     path_cat_names: str,
     path_carrier_names: str,
@@ -29,7 +29,7 @@ def get_steel_demand_df(
     """Execute the data processing pipeline for the "Iron and steel" sub-sector.
 
     Args:
-        config_steel (dict): steel sector configuration.
+        steel_config (dict): steel sector configuration.
         path_energy_balances (str): country energy balances (usually from eurostat).
         path_cat_names (str): eurostat category mapping file.
         path_carrier_names (str): eurostat carrier name mapping file.
@@ -56,7 +56,7 @@ def get_steel_demand_df(
 
     # Process data
     new_steel_demand = transform_jrc_subsector_demand(
-        jrc_energy, jrc_prod, config_steel
+        jrc_energy, jrc_prod, steel_config
     )
     new_steel_demand = filling.fill_missing_countries_years(
         energy_balances_df, cat_names_df, carrier_names_df, new_steel_demand
@@ -99,7 +99,7 @@ def transform_jrc_subsector_demand(
         xr.Dataset: processed dataframe with the expected steel energy consumption.
     """
     # Gather relevant industrial processes
-    sintering_intensity = jrc.get_subsection_final_intensity(
+    sintering_intensity = jrc.get_sec_subsec_final_intensity(
         "Integrated steelworks",
         "Steel: Sinter/Pellet making",
         "Integrated steelworks",
@@ -109,7 +109,7 @@ def transform_jrc_subsector_demand(
         fill_empty=True,
     )
 
-    eaf_smelting_intensity = jrc.get_subsection_final_intensity(
+    eaf_smelting_intensity = jrc.get_sec_subsec_final_intensity(
         "Electric arc",
         "Steel: Smelters",
         "Electric arc",
@@ -118,7 +118,7 @@ def transform_jrc_subsector_demand(
         jrc_prod,
         fill_empty=True,
     )
-    eaf_intensity = jrc.get_subsection_final_intensity(
+    eaf_intensity = jrc.get_sec_subsec_final_intensity(
         "Electric arc",
         "Steel: Electric arc",
         "Electric arc",
@@ -127,7 +127,7 @@ def transform_jrc_subsector_demand(
         jrc_prod,
         fill_empty=True,
     )
-    refining_intensity = jrc.get_subsection_final_intensity(
+    refining_intensity = jrc.get_sec_subsec_final_intensity(
         "Electric arc",
         "Steel: Furnaces, Refining and Rolling",
         "Electric arc",
@@ -136,7 +136,7 @@ def transform_jrc_subsector_demand(
         jrc_prod,
         fill_empty=True,
     )
-    finishing_intensity = jrc.get_subsection_final_intensity(
+    finishing_intensity = jrc.get_sec_subsec_final_intensity(
         "Electric arc",
         "Steel: Products finishing",
         "Electric arc",
@@ -145,7 +145,7 @@ def transform_jrc_subsector_demand(
         jrc_prod,
         fill_empty=True,
     )
-    auxiliary_intensity = jrc.get_auxiliary_electric_final_intensity(
+    auxiliary_intensity = jrc.get_sec_final_intensity_auxiliary_electric(
         "Electric arc", "Electric arc", jrc_energy, jrc_prod, fill_empty=True
     )
 
@@ -182,21 +182,22 @@ def transform_jrc_subsector_demand(
     electric_intensity = electric_intensity.where(
         electric_intensity > 0, other=mean_demand_per_year
     )
-    electric_intensity = electric_intensity.assign_coords(carrier_name="electricity")
 
     # Hydrogen consumption for H-DRI:
     # only for country/year that handle iron ore and don't recycle all their steel
     h_dri_h2_intensity = H2_LHV_KTOE * _get_h2_to_steel(recycled_share)
 
     h2_intensity = electric_intensity.where(sintering_intensity > 0).fillna(0)
     h2_intensity = h2_intensity.where(h2_intensity == 0, h_dri_h2_intensity)
-    h2_intensity = h2_intensity.assign_coords(carrier_name="hydrogen")
+    h2_intensity = h2_intensity.assign_coords(carrier_name="Hydrogen")
 
     # Low heat
-    low_heat_intensity = jrc.get_subsection_useful_intensity(
+    low_heat_intensity = jrc.get_section_subsection_useful_intensity(
         "Electric arc", "Low enthalpy heat", "Electric arc", jrc_energy, jrc_prod
     )
-    low_heat_intensity = low_heat_intensity.assign_coords(carrier_name="space_heat")
+    low_heat_intensity = low_heat_intensity.assign_coords(
+        carrier_name="Low enthalpy heat"
+    )
 
     # Combine and transform to energy demand
     total_intensity = xr.concat(
@@ -213,7 +214,7 @@ def transform_jrc_subsector_demand(
 
 if __name__ == "__main__":
     get_steel_demand_df(
-        config_steel=snakemake.params.config_steel,
+        steel_config=snakemake.params.steel_config,
         path_energy_balances=snakemake.input.path_energy_balances,
         path_cat_names=snakemake.input.path_cat_names,
         path_carrier_names=snakemake.input.path_carrier_names,