pypsa-eur/scripts/build_gas_input_locations.py

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

188 lines
6.0 KiB
Python
Raw Normal View History

# -*- coding: utf-8 -*-
2024-02-19 15:21:48 +00:00
# SPDX-FileCopyrightText: : 2021-2024 The PyPSA-Eur Authors
2023-03-06 17:49:23 +00:00
#
# SPDX-License-Identifier: MIT
"""
Build import locations for fossil gas from entry-points, LNG terminals and
2023-03-09 11:45:43 +00:00
production sites with data from SciGRID_gas and Global Energy Monitor.
"""
import json
import logging
import geopandas as gpd
import pandas as pd
2024-02-12 10:53:20 +00:00
from _helpers import configure_logging, set_scenario_config
from cluster_gas_network import load_bus_regions
2024-01-19 09:47:58 +00:00
logger = logging.getLogger(__name__)
def read_scigrid_gas(fn):
df = gpd.read_file(fn)
expanded_param = df.param.apply(json.loads).apply(pd.Series)
df = pd.concat([df, expanded_param], axis=1)
df.drop(["param", "uncertainty", "method"], axis=1, inplace=True)
return df
def build_gem_lng_data(fn):
df = pd.read_excel(fn, sheet_name="LNG terminals - data")
df = df.set_index("ComboID")
remove_country = ["Cyprus", "Turkey"] # noqa: F841
remove_terminal = [ # noqa: F841
"Puerto de la Luz LNG Terminal",
"Gran Canaria LNG Terminal",
]
status_list = ["Operating", "Construction"] # noqa: F841
df = df.query(
"Status in @status_list \
& FacilityType == 'Import' \
& Country != @remove_country \
& TerminalName != @remove_terminal \
& CapacityInMtpa != '--' \
& CapacityInMtpa != 0"
)
geometry = gpd.points_from_xy(df["Longitude"], df["Latitude"])
gdf = gpd.GeoDataFrame(df, geometry=geometry, crs="EPSG:4326")
return gdf
def build_gem_prod_data(fn):
df = pd.read_excel(fn, sheet_name="Gas extraction - main")
df = df.set_index("GEM Unit ID")
remove_country = ["Cyprus", "Türkiye"] # noqa: F841
remove_fuel_type = ["oil"] # noqa: F841
2024-01-03 07:13:01 +00:00
status_list = ["operating", "in development"] # noqa: F841
df = df.query(
"Status in @status_list \
& 'Fuel type' != 'oil' \
& Country != @remove_country \
& ~Latitude.isna() \
& ~Longitude.isna()"
).copy()
p = pd.read_excel(fn, sheet_name="Gas extraction - production")
p = p.set_index("GEM Unit ID")
p = p[p["Fuel description"].str.contains("gas")]
capacities = pd.DataFrame(index=df.index)
for key in ["production", "production design capacity", "reserves"]:
2024-01-03 07:13:01 +00:00
cap = (
p.loc[p["Production/reserves"] == key, "Quantity (converted)"]
.groupby("GEM Unit ID")
.sum()
.reindex(df.index)
)
# assume capacity such that 3% of reserves can be extracted per year (25% quantile)
2024-01-03 07:13:01 +00:00
annualization_factor = 0.03 if key == "reserves" else 1.0
capacities[key] = cap * annualization_factor
2024-01-03 07:13:01 +00:00
df["mcm_per_year"] = (
capacities["production"]
.combine_first(capacities["production design capacity"])
.combine_first(capacities["reserves"])
2024-01-03 07:13:01 +00:00
)
geometry = gpd.points_from_xy(df["Longitude"], df["Latitude"])
gdf = gpd.GeoDataFrame(df, geometry=geometry, crs="EPSG:4326")
return gdf
def build_gas_input_locations(gem_fn, entry_fn, sto_fn, countries):
# LNG terminals
lng = build_gem_lng_data(gem_fn)
# Entry points from outside the model scope
entry = read_scigrid_gas(entry_fn)
entry["from_country"] = entry.from_country.str.rstrip()
entry = entry.loc[
~(entry.from_country.isin(countries) & entry.to_country.isin(countries))
& ~entry.name.str.contains("Tegelen") # only take non-EU entries
| (entry.from_country == "NO") # malformed datapoint # entries from NO to GB
].copy()
2024-01-03 07:13:01 +00:00
sto = read_scigrid_gas(sto_fn)
remove_country = ["RU", "UA", "TR", "BY"] # noqa: F841
sto = sto.query("country_code not in @remove_country").copy()
# production sites inside the model scope
prod = build_gem_prod_data(gem_fn)
mcm_per_day_to_mw = 437.5 # MCM/day to MWh/h
mcm_per_year_to_mw = 1.199 # MCM/year to MWh/h
mtpa_to_mw = 1649.224 # mtpa to MWh/h
mcm_to_gwh = 11.36 # MCM to GWh
lng["capacity"] = lng["CapacityInMtpa"] * mtpa_to_mw
entry["capacity"] = entry["max_cap_from_to_M_m3_per_d"] * mcm_per_day_to_mw
prod["capacity"] = prod["mcm_per_year"] * mcm_per_year_to_mw
sto["capacity"] = sto["max_cushionGas_M_m3"] * mcm_to_gwh
lng["type"] = "lng"
entry["type"] = "pipeline"
prod["type"] = "production"
sto["type"] = "storage"
sel = ["geometry", "capacity", "type"]
return pd.concat([prod[sel], entry[sel], lng[sel], sto[sel]], ignore_index=True)
if __name__ == "__main__":
if "snakemake" not in globals():
2023-03-06 18:09:45 +00:00
from _helpers import mock_snakemake
snakemake = mock_snakemake(
"build_gas_input_locations",
clusters="128",
)
2024-02-12 10:53:20 +00:00
configure_logging(snakemake)
set_scenario_config(snakemake)
regions = load_bus_regions(
snakemake.input.regions_onshore, snakemake.input.regions_offshore
)
# add a buffer to eastern countries because some
# entry points are still in Russian or Ukrainian territory.
buffer = 9000 # meters
eastern_countries = ["FI", "EE", "LT", "LV", "PL", "SK", "HU", "RO"]
add_buffer_b = regions.index.str[:2].isin(eastern_countries)
regions.loc[add_buffer_b] = (
regions[add_buffer_b].to_crs(3035).buffer(buffer).to_crs(4326)
)
countries = regions.index.str[:2].unique().str.replace("GB", "UK")
gas_input_locations = build_gas_input_locations(
snakemake.input.gem,
snakemake.input.entry,
snakemake.input.storage,
countries,
)
gas_input_nodes = gpd.sjoin(gas_input_locations, regions, how="left")
gas_input_nodes.rename(columns={"name": "bus"}, inplace=True)
gas_input_nodes.to_file(snakemake.output.gas_input_nodes, driver="GeoJSON")
ensure_columns = ["lng", "pipeline", "production", "storage"]
gas_input_nodes_s = (
gas_input_nodes.groupby(["bus", "type"])["capacity"]
.sum()
.unstack()
.reindex(columns=ensure_columns)
)
gas_input_nodes_s.columns.name = "capacity"
gas_input_nodes_s.to_csv(snakemake.output.gas_input_nodes_simplified)