[pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
2024-02-23 12:56:43 +00:00 · 2024-02-23 12:56:43 +00:00 · ace51b9e55
commit ace51b9e55
parent 3298572ced
2 changed files with 106 additions and 69 deletions
--- a/rules/common.smk
+++ b/rules/common.smk
@ -137,6 +137,7 @@ def input_eurostat(w):
    else:
        return "data/bundle-sector/eurostat-energy_balances-april_2023_edition"
 def solved_previous_horizon(w):
    planning_horizons = config_provider("scenario", "planning_horizons")(w)
    i = planning_horizons.index(int(w.planning_horizons))
--- a/scripts/build_energy_totals.py
+++ b/scripts/build_energy_totals.py
@ -8,6 +8,7 @@ Build total energy demands per country using JRC IDEES, eurostat, and EEA data.
 import logging
 import multiprocessing as mp
 import os
 from functools import partial
 import country_converter as coco
@ -16,7 +17,6 @@ import numpy as np
 import pandas as pd
 from _helpers import configure_logging, mute_print, set_scenario_config
 from tqdm import tqdm
 import os
 cc = coco.CountryConverter()
 logger = logging.getLogger(__name__)
@ -155,35 +155,47 @@ def build_eurostat(input_eurostat, countries, report_year, year):
    else:
        # read in every country file in countries
        eurostat = pd.DataFrame()
-        countries = [country if country != 'GB' else 'UK' for country in countries]
+        countries = [country if country != "GB" else "UK" for country in countries]
-        countries = [country if country != 'GR' else 'EL' for country in countries]
+        countries = [country if country != "GR" else "EL" for country in countries]
        for country in countries:
            filename = f"/{country}-Energy-balance-sheets-April-2023-edition.xlsb"
            if os.path.exists(input_eurostat + filename):
                df = pd.read_excel(
                    input_eurostat + filename,
-                    engine='pyxlsb',
+                    engine="pyxlsb",
                    sheet_name=str(year),
                    skiprows=4,
-                    index_col=list(range(4)))
+                    index_col=list(range(4)),
                )
                # replace entry 'Z' with 0
-                df.replace('Z', 0, inplace=True)
+                df.replace("Z", 0, inplace=True)
                # write 'International aviation' to the 2nd level of the multiindex
-                index_number = (df.index.get_level_values(1) == 'International aviation').argmax()
+                index_number = (
-                new_index = ('-', 'International aviation', 'International aviation', 'ktoe')
+                    df.index.get_level_values(1) == "International aviation"
                ).argmax()
                new_index = (
                    "-",
                    "International aviation",
                    "International aviation",
                    "ktoe",
                )
                modified_index = list(df.index)
                modified_index[index_number] = new_index
-                df.index = pd.MultiIndex.from_tuples(modified_index, names=df.index.names)
+                df.index = pd.MultiIndex.from_tuples(
                    modified_index, names=df.index.names
                )
                # drop the annoying subhead line
                df.drop(df[df[year] == year].index, inplace=True)
                # replace 'Z' with 0
-                df = df.replace('Z', 0)
+                df = df.replace("Z", 0)
                # add country to the multiindex
                new_tuple = [(country, *idx) for idx in df.index]
-                new_mindex = pd.MultiIndex.from_tuples(new_tuple, names=['country', None, 'name', None, 'unit'])
+                new_mindex = pd.MultiIndex.from_tuples(
                    new_tuple, names=["country", None, "name", None, "unit"]
                )
                df.index = new_mindex
                # make numeric values where possible
-                df = df.apply(pd.to_numeric, errors='coerce')
+                df = df.apply(pd.to_numeric, errors="coerce")
                # drop non-numeric columns
                non_numeric_cols = df.columns[df.dtypes != float]
                df.drop(non_numeric_cols, axis=1, inplace=True)
@ -193,19 +205,30 @@ def build_eurostat(input_eurostat, countries, report_year, year):
        eurostat.drop(["Unnamed: 4", year, "Unnamed: 6"], axis=1, inplace=True)
        # Renaming some indices
        rename = {
-            'Households': 'Residential',
+            "Households": "Residential",
-            'Commercial & public services': 'Services',
+            "Commercial & public services": "Services",
-            'Domestic navigation': 'Domestic Navigation'
+            "Domestic navigation": "Domestic Navigation",
        }
        for name, rename in rename.items():
            eurostat.index = eurostat.index.set_levels(
-            eurostat.index.levels[3].where(eurostat.index.levels[3] != name, rename),
+                eurostat.index.levels[3].where(
-            level=3)
+                    eurostat.index.levels[3] != name, rename
-        new_index = eurostat.index.set_levels(eurostat.index.levels[2].where(eurostat.index.levels[2] != 'International maritime bunkers', 'Bunkers'), level=2)
+                ),
                level=3,
            )
        new_index = eurostat.index.set_levels(
            eurostat.index.levels[2].where(
                eurostat.index.levels[2] != "International maritime bunkers", "Bunkers"
            ),
            level=2,
        )
        eurostat.index = new_index
-        eurostat.rename(columns={'Total': 'Total all products'}, inplace=True)
+        eurostat.rename(columns={"Total": "Total all products"}, inplace=True)
-        eurostat.index = eurostat.index.set_levels(eurostat.index.levels[0].where(eurostat.index.levels[0] != 'UK', 'GB'), level=0)
+        eurostat.index = eurostat.index.set_levels(
            eurostat.index.levels[0].where(eurostat.index.levels[0] != "UK", "GB"),
            level=0,
        )
        df = eurostat * 11.63 / 1e3
@ -751,7 +774,9 @@ def build_co2_totals(countries, eea_co2, eurostat_co2, report_year):
                "industrial non-elec": (ct, "+", "Industry"),
                # does not include non-energy emissions
                "agriculture": (eurostat_co2.index.get_level_values(0) == ct)
-                & eurostat_co2.index.isin(["Agriculture / Forestry", "Fishing"], level=3),
+                & eurostat_co2.index.isin(
                    ["Agriculture / Forestry", "Fishing"], level=3
                ),
            }
        else:
            mappings = {
@ -768,7 +793,9 @@ def build_co2_totals(countries, eea_co2, eurostat_co2, report_year):
                "industrial non-elec": (ct, "+", "Industry sector"),
                # does not include non-energy emissions
                "agriculture": (eurostat_co2.index.get_level_values(0) == ct)
-                & eurostat_co2.index.isin(["Agriculture & forestry", "Fishing"], level=3),
+                & eurostat_co2.index.isin(
                    ["Agriculture & forestry", "Fishing"], level=3
                ),
            }
        for i, mi in mappings.items():
@ -812,20 +839,26 @@ def build_transport_data(countries, population, idees):
    return transport_data
 def rescale(idees_countries, energy, eurostat):
-    '''
+    """
-    Takes JRC IDEES data from 2015 and rescales it by the ratio of the 
+    Takes JRC IDEES data from 2015 and rescales it by the ratio of the eurostat
-    eurostat data and the 2015 eurostat data.
+    data and the 2015 eurostat data.
    missing data: ['passenger car efficiency', 'passenger cars']
-    '''
+    """
    # read in the eurostat data for 2015
-    eurostat_2015 = build_eurostat(input_eurostat, countries, 2023, 2015)[["Total all products", "Electricity"]]
+    eurostat_2015 = build_eurostat(input_eurostat, countries, 2023, 2015)[
        ["Total all products", "Electricity"]
    ]
    # eurostat_2015 = eurostat_2015.rename(index={'GB': 'UK'}, level=0)
    eurostat_year = eurostat[["Total all products", "Electricity"]]
    # calculate the ratio of the two data sets
    ratio = eurostat_year / eurostat_2015
-    ratio = ratio.droplevel([1,4])
+    ratio = ratio.droplevel([1, 4])
-    ratio.rename(columns={"Total all products": "total", "Electricity": "ele"}, inplace=True)
+    ratio.rename(
        columns={"Total all products": "total", "Electricity": "ele"}, inplace=True
    )
    ratio = ratio.rename(index={"GB": "UK"}, level=0)
    residential_total = [
@ -892,54 +925,55 @@ def rescale(idees_countries, energy, eurostat):
    ]
    avia_inter = [
-        'total aviation passenger',
+        "total aviation passenger",
-        'total aviation freight',
+        "total aviation freight",
-        'total international aviation passenger',
+        "total international aviation passenger",
-        'total international aviation freight',
+        "total international aviation freight",
-        'total international aviation'
+        "total international aviation",
    ]
    avia_domestic = [
-        'total domestic aviation passenger',
+        "total domestic aviation passenger",
-        'total domestic aviation freight',
+        "total domestic aviation freight",
-        'total domestic aviation',
+        "total domestic aviation",
    ]
    navigation = [
        "total domestic navigation",
    ]
-    idees_countries = idees_countries.repalce({'GB': 'UK', 'GR': 'EL'})
+    idees_countries = idees_countries.repalce({"GB": "UK", "GR": "EL"})
    for country in idees_countries:
-        res = ratio.loc[(country, slice(None), 'Residential')]
+        res = ratio.loc[(country, slice(None), "Residential")]
-        energy.loc[country, residential_total] *= res[['total']].iloc[0,0]
+        energy.loc[country, residential_total] *= res[["total"]].iloc[0, 0]
-        energy.loc[country, residential_ele] *= res[['ele']].iloc[0,0]
+        energy.loc[country, residential_ele] *= res[["ele"]].iloc[0, 0]
-        ser = ratio.loc[(country, slice(None), 'Services')]
+        ser = ratio.loc[(country, slice(None), "Services")]
-        energy.loc[country, service_total] *= ser[['total']].iloc[0,0]
+        energy.loc[country, service_total] *= ser[["total"]].iloc[0, 0]
-        energy.loc[country, service_ele] *= ser[['ele']].iloc[0,0]
+        energy.loc[country, service_ele] *= ser[["ele"]].iloc[0, 0]
-        agri = ratio.loc[(country, slice(None), 'Agriculture & forestry')]
+        agri = ratio.loc[(country, slice(None), "Agriculture & forestry")]
-        energy.loc[country, agri_total] *= agri[['total']].iloc[0,0]
+        energy.loc[country, agri_total] *= agri[["total"]].iloc[0, 0]
-        energy.loc[country, agri_ele] *= agri[['ele']].iloc[0,0]
+        energy.loc[country, agri_ele] *= agri[["ele"]].iloc[0, 0]
-        road = ratio.loc[(country, slice(None), 'Road')]
+        road = ratio.loc[(country, slice(None), "Road")]
-        energy.loc[country, road_total] *= road[['total']].iloc[0,0]
+        energy.loc[country, road_total] *= road[["total"]].iloc[0, 0]
-        energy.loc[country, road_ele] *= road[['ele']].iloc[0,0]
+        energy.loc[country, road_ele] *= road[["ele"]].iloc[0, 0]
-        rail = ratio.loc[(country, slice(None), 'Rail')]
+        rail = ratio.loc[(country, slice(None), "Rail")]
-        energy.loc[country, rail_total] *= rail[['total']].iloc[0,0]
+        energy.loc[country, rail_total] *= rail[["total"]].iloc[0, 0]
-        energy.loc[country, rail_ele] *= rail[['ele']].iloc[0,0]
+        energy.loc[country, rail_ele] *= rail[["ele"]].iloc[0, 0]
-        avi_d = ratio.loc[(country, slice(None), 'Domestic aviation')]
+        avi_d = ratio.loc[(country, slice(None), "Domestic aviation")]
-        avi_i = ratio.loc[(country, 'International aviation', slice(None))]
+        avi_i = ratio.loc[(country, "International aviation", slice(None))]
-        energy.loc[country, avia_inter] *= avi_i[['total']].iloc[0,0]
+        energy.loc[country, avia_inter] *= avi_i[["total"]].iloc[0, 0]
-        energy.loc[country, avia_domestic] *= avi_d[['total']].iloc[0,0]
+        energy.loc[country, avia_domestic] *= avi_d[["total"]].iloc[0, 0]
-        nav = ratio.loc[(country, slice(None), 'Domestic Navigation')]
+        nav = ratio.loc[(country, slice(None), "Domestic Navigation")]
-        energy.loc[country, navigation] *= nav[['total']].iloc[0,0]
+        energy.loc[country, navigation] *= nav[["total"]].iloc[0, 0]
    return energy
 if __name__ == "__main__":
    if "snakemake" not in globals():
        from _helpers import mock_snakemake
@ -977,7 +1011,9 @@ if __name__ == "__main__":
    energy.to_csv(snakemake.output.energy_name)
    # use rescaled idees data to calculate district heat share
-    district_heat_share = build_district_heat_share(countries, energy.loc[idees_countries])
+    district_heat_share = build_district_heat_share(
        countries, energy.loc[idees_countries]
    )
    district_heat_share.to_csv(snakemake.output.district_heat_share)
    base_year_emissions = params["base_emissions_year"]