Add FlexMeasures plugins, USEF protocol, and Cariflex simulator

- flexmeasures-entsoe: ENTSO-E data plugin
- flexmeasures-weather: Weather data plugin
- USEF Flex Trading Protocol PDF (2.4MB)
- Cariflex simulator (publishes to Redis)
- Dashboard Grafana updated with correct InfluxDB queries
- All tools extracted in /tools/
This commit is contained in:
Eric F
2026-06-08 07:38:57 -04:00
parent 3fb90a8033
commit d4974e3241
72 changed files with 5185 additions and 0 deletions

View File

@@ -0,0 +1,369 @@
from typing import Dict, Optional, Tuple, Union
from datetime import datetime, timedelta
from logging import Logger
from entsoe import EntsoePandasClient
from flask import current_app
from packaging import version
from pandas.tseries.frequencies import to_offset
import pandas as pd
import click
import pytz
import entsoe
from flexmeasures.data.utils import get_data_source, save_to_db
from flexmeasures import Asset, AssetType, Sensor, Source, __version__ as flexmeasures_version
from flexmeasures.data import db
from flexmeasures.utils.time_utils import server_now
from timely_beliefs import BeliefsDataFrame
from flexmeasures.cli.utils import MsgStyle
from . import (
DEFAULT_DATA_SOURCE_NAME,
DEFAULT_DERIVED_DATA_SOURCE,
DEFAULT_COUNTRY_CODE,
DEFAULT_COUNTRY_TIMEZONE,
) # noqa: E402
FM_SUPPORTS_ACCOUNT_LINKED_SOURCES = version.parse(
flexmeasures_version
) >= version.parse("0.32")
if FM_SUPPORTS_ACCOUNT_LINKED_SOURCES:
from flexmeasures import Account
from flexmeasures.data.services.data_sources import get_or_create_source
def _find_existing_source(source_name: str, source_type: str) -> Optional[Source]:
return (
Source.query.filter(
Source.name == source_name,
Source.type == source_type,
)
.order_by(Source.id)
.first()
)
def get_or_create_entsoe_account():
"""Make sure we have an account for the ENTSO-E provider service."""
account_name = current_app.config.get(
"ENTSOE_DATA_SOURCE_NAME", DEFAULT_DATA_SOURCE_NAME
)
entsoe_account = Account.query.filter(
Account.name == account_name,
).one_or_none()
if entsoe_account is None:
entsoe_account = Account(name=account_name)
db.session.add(entsoe_account)
db.session.flush()
return entsoe_account
def _ensure_entsoe_source(
source_name: str,
source_type: str,
legacy_source_type: Optional[str] = None,
) -> Source:
"""Reuse legacy sources when possible while branching explicitly on FM version."""
entsoe_account = None
if FM_SUPPORTS_ACCOUNT_LINKED_SOURCES:
entsoe_account = get_or_create_entsoe_account()
existing_source = _find_existing_source(source_name, source_type)
if existing_source is None and legacy_source_type is not None:
existing_source = _find_existing_source(source_name, legacy_source_type)
if existing_source is not None:
existing_source.type = source_type
if existing_source is not None:
if entsoe_account is not None and getattr(existing_source, "account", None) is None:
existing_source.account = entsoe_account
return existing_source
if not FM_SUPPORTS_ACCOUNT_LINKED_SOURCES:
return get_data_source(
data_source_name=source_name,
data_source_type=source_type,
)
source_kwargs = dict(
source=source_name,
source_type=source_type,
flush=False,
)
if entsoe_account is not None:
source_kwargs["account"] = entsoe_account
return get_or_create_source(**source_kwargs)
def ensure_data_source() -> Source:
"""Make sure we have a raw ENTSO-E data source of type "market"."""
return _ensure_entsoe_source(
source_name=current_app.config.get(
"ENTSOE_DATA_SOURCE_NAME", DEFAULT_DATA_SOURCE_NAME
),
source_type="market",
legacy_source_type="forecasting script",
)
def ensure_data_source_for_derived_data() -> Source:
"""Make sure we have a data source for data derived from ENTSO-E data."""
return _ensure_entsoe_source(
source_name=current_app.config.get(
"ENTSOE_DERIVED_DATA_SOURCE", DEFAULT_DERIVED_DATA_SOURCE
),
source_type="forecasting script",
)
def ensure_transmission_zone_asset(country_code: str) -> Asset:
"""
Ensure a GenericAsset exists to model the transmission zone for which this plugin gathers data.
"""
transmission_zone_type = AssetType.query.filter(
AssetType.name == "transmission zone"
).one_or_none()
if not transmission_zone_type:
current_app.logger.info("Adding transmission zone type ...")
transmission_zone_type = AssetType(
name="transmission zone",
description="A grid regulated & balanced as a whole, usually a national grid.",
)
db.session.add(transmission_zone_type)
ga_name = f"{country_code} transmission zone"
transmission_zone = Asset.query.filter(Asset.name == ga_name).one_or_none()
if not transmission_zone:
current_app.logger.info(f"Adding {ga_name} ...")
transmission_zone = Asset(
name=ga_name,
generic_asset_type=transmission_zone_type,
account_id=None, # public
)
db.session.add(transmission_zone)
db.session.commit()
return transmission_zone
def ensure_sensors(
sensor_specifications: Tuple,
country_code: str,
timezone: str,
) -> Dict[str, Sensor]:
"""
Ensure a GenericAsset exists to model the transmission zone for which this plugin gathers
generation data, then add specified sensors for relevant data we collect.
If new sensors got created, the session has been flushed.
"""
sensors = {}
sensors_created: bool = False
transmission_zone = ensure_transmission_zone_asset(country_code)
for sensor_name, unit, event_resolution, data_by_entsoe in sensor_specifications:
sensor = Sensor.query.filter(
Sensor.name == sensor_name,
Sensor.unit == unit,
Sensor.generic_asset == transmission_zone,
).one_or_none()
if not sensor:
current_app.logger.info(f"Adding sensor {sensor_name} ...")
sensor = Sensor(
name=sensor_name,
unit=unit,
generic_asset=transmission_zone,
timezone=timezone,
event_resolution=event_resolution,
)
db.session.add(sensor)
sensors_created = True
elif sensor.event_resolution != event_resolution:
current_app.logger.warning(
f"The {sensor_name} sensor exists, but has a resolution of {sensor.event_resolution} instead of {event_resolution}. Please refer the 'October 1st 2025 go-live' instructions in `README.md`."
)
sensor.data_by_entsoe = data_by_entsoe
sensors[sensor_name] = sensor
if sensors_created:
db.session.flush()
return sensors
def get_auth_token_from_config_and_set_server_url() -> str:
"""
Read ENTSOE auth token from config, raise if not given.
If test server is supposed to be used, we'll try to read the token
usable for that, and also change the URL.
"""
use_test_server = current_app.config.get("ENTSOE_USE_TEST_SERVER", False)
if use_test_server:
auth_token = current_app.config.get("ENTSOE_AUTH_TOKEN_TEST_SERVER")
entsoe.entsoe.URL = "https://iop-transparency.entsoe.eu/api"
else:
auth_token = current_app.config.get("ENTSOE_AUTH_TOKEN")
entsoe.entsoe.URL = "https://web-api.tp.entsoe.eu/api"
if not auth_token:
click.echo("Setting ENTSOE_AUTH_TOKEN seems empty!")
raise click.Abort
return auth_token
def ensure_country_code_and_timezone(
country_code: Optional[str] = None,
country_timezone: Optional[str] = None,
) -> Tuple[str, str]:
if country_code is None:
country_code = current_app.config.get(
"ENTSOE_COUNTRY_CODE", DEFAULT_COUNTRY_CODE
)
if country_timezone is None:
country_timezone = current_app.config.get(
"ENTSOE_COUNTRY_TIMEZONE", DEFAULT_COUNTRY_TIMEZONE
)
return country_code, country_timezone
def create_entsoe_client() -> EntsoePandasClient:
auth_token = get_auth_token_from_config_and_set_server_url()
client = EntsoePandasClient(api_key=auth_token)
return client
def abort_if_data_empty(data: Union[pd.DataFrame, pd.Series]):
if data.empty:
click.echo(
"Result is empty. Probably ENTSO-E does not provide these forecasts yet ..."
)
raise click.Abort
def abort_if_data_incomplete(
data: Union[pd.DataFrame, pd.Series],
from_time: pd.Timestamp,
until_time: pd.Timestamp,
resolution: pd.Timedelta,
):
expected_periods = int((until_time - from_time) / resolution)
if len(data) < expected_periods:
click.secho(
f"Result is incomplete. Expected {expected_periods} periods but got {len(data)}. Probably ENTSO-E does not provide these forecasts yet ...",
**MsgStyle.ERROR,
)
raise click.Abort
def parse_from_and_to_dates(
from_date: Optional[datetime],
until_date: Optional[datetime],
country_timezone: str,
default_to: str = "today-and-tomorrow", # Can be "tomorrow" or "today"
) -> Tuple[pd.Timestamp, pd.Timestamp]:
"""
Parse CLI options for start and end date (or set default to today and tomorrow) for inout to entsoe-py
Note: we expect only dates as input here, and until_date is inclusive, so we extend it with 24h - so if from_date is equal to until_date, we return 00:00 and 24:00 of that day.
Note: entsoe-py expects time params as pd.Timestamp
"""
tz = pytz.timezone(country_timezone)
now = datetime.now(tz)
today_start = now.replace(hour=0, minute=0, second=0, microsecond=0)
if default_to == "today":
default_start = today_start
default_end = today_start + timedelta(days=1)
elif default_to == "tomorrow":
default_start = today_start + timedelta(days=1)
default_end = default_start + timedelta(days=1)
elif default_to == "today-and-tomorrow":
default_start = today_start
default_end = default_start + timedelta(days=2)
else:
raise ValueError(
f"Invalid default_to value: {default_to}. Expected 'today', 'tomorrow' or 'today-and-tomorrow'."
)
if from_date is None:
start_date = pd.Timestamp(default_start)
else:
start_date = pd.Timestamp(from_date, tzinfo=pytz.timezone(country_timezone))
if until_date is None:
end_date = pd.Timestamp(default_end)
else:
end_date = pd.Timestamp(until_date, tzinfo=pytz.timezone(country_timezone))
# The until_date provided is considered inclusive, so we add 24 hours to include the entire day
end_date += pd.Timedelta(hours=24)
return start_date, end_date
def resample_if_needed(s: pd.Series, sensor: Sensor) -> pd.Series:
inferred_frequency = pd.infer_freq(s.index)
if inferred_frequency is None:
raise ValueError(
"Data has no discernible frequency from which to derive an event resolution."
)
inferred_resolution = pd.to_timedelta(to_offset(inferred_frequency))
target_resolution = sensor.event_resolution
if inferred_resolution == target_resolution:
return s
elif inferred_resolution > target_resolution:
current_app.logger.debug(f"Upsampling data for {sensor.name} ...")
index = pd.date_range(
s.index[0],
s.index[-1] + inferred_resolution,
freq=target_resolution,
inclusive="left",
)
s = s.reindex(index).pad()
elif inferred_resolution < target_resolution:
current_app.logger.debug(f"Downsampling data for {sensor.name} ...")
s = s.resample(target_resolution).mean()
current_app.logger.debug(f"Resampled data for {sensor.name}: \n%s" % s)
return s
def save_entsoe_series(
series: pd.Series,
sensor: Sensor,
entsoe_source: Source,
country_timezone: str,
now: Optional[datetime] = None,
):
"""
Save a series gotten from ENTSO-E to a FlexMeasures database.
"""
if not now:
now = server_now().astimezone(pytz.timezone(country_timezone))
belief_times = (
(series.index.floor("D") - pd.Timedelta("6h"))
.to_frame(name="clipped_belief_times")
.clip(upper=now)
.set_index("clipped_belief_times")
.index
) # published no later than D-1 18:00 Brussels time
bdf = BeliefsDataFrame(
series,
source=entsoe_source,
sensor=sensor,
belief_time=belief_times,
)
# TODO: evaluate some traits of the data via FlexMeasures, see https://github.com/SeitaBV/flexmeasures-entsoe/issues/3
status = save_to_db(bdf)
if status == "success_but_nothing_new":
current_app.logger.info("Done. These beliefs had already been saved before.")
elif status == "success_with_unchanged_beliefs_skipped":
current_app.logger.info("Done. Some beliefs had already been saved before.")
def start_import_log(
import_type: str,
from_time: pd.Timestamp,
until_time: pd.Timestamp,
country_code: str,
country_timezone: str,
) -> Tuple[Logger, datetime]:
log = current_app.logger
log.info(
f"Importing {import_type} data for {country_code} (timezone {country_timezone}), starting at {from_time}, up until {until_time}, from ENTSO-E at {entsoe.entsoe.URL} ..."
)
now = server_now().astimezone(pytz.timezone(country_timezone))
return log, now