Last active
August 6, 2021 15:52
-
-
Save alorenzo175/d25293c4e47bec307ede7cd70022582c to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
""" | |
An example script to generate random forecasts for participants | |
in the first test trial of the Solar Forecast Arbiter. | |
This is meant to be explored and modified. A generation script | |
should be run periodically as a cronjob or via another scheduling | |
mechanism at an appropriate interval that will be determined by | |
the trial/forecast parameters. | |
""" | |
import logging | |
import sys | |
import numpy as np | |
import pandas as pd | |
from solarforecastarbiter.io import api | |
from solarforecastarbiter.reference_forecasts import utils | |
API_URL = 'https://api.solarforecastarbiter.org' | |
# Deterministic forecast UUIDs | |
FORECAST_UUIDS = [ | |
# the UUIDS of the relevant deterministic forecasts go here | |
] | |
# Probabilistic forecast group UUIDs | |
# a separate forecast for each constant value will | |
# be uploaded separately | |
PROBABILISTIC_FORECAST_UUIDS = [ | |
# The UUIDS of the relevant probabilistic forecast groups go here | |
] | |
if len(FORECAST_UUIDS) == 0 and len(PROBABILISTIC_FORECAST_UUIDS) == 0: | |
raise ValueError( | |
'Please edit FORECAST_UUIDS and PROBABILISTIC_FORECAST_UUIDS ' | |
'to add the appropriate UUIDS of the trial forecasts.') | |
# Edit this level to 'DEBUG' for more verbose logging | |
logging.basicConfig(level='INFO') | |
# here, we read the file provided as an argument to the script | |
# to get the username and password (separated by a new line). | |
# Alternatives include using environment variables or hardcoding the values | |
with open(sys.argv[1], 'r') as f: | |
username, password = f.read().split('\n')[:2] | |
# Setup an APISession to communicate with the solararbiter API | |
token = api.request_cli_access_token(username, password) | |
session = api.APISession(token, base_url=API_URL) | |
def list_forecasts_for_the_trial(session, string_in_extra_params): | |
"""Function that could be used to examine the all forecasts | |
and select the relevant forecasts based on the forecast | |
extra_parameters.""" | |
# Get information about the current user | |
user_info = session.get_user_info() | |
# Retrive all forecasts the user has access to | |
all_forecasts = session.list_forecasts() | |
# Filter out the forecasts not in the trial | |
# for the purposes of this trial, the trial name will | |
# appear in the extra_parameters section of the Forecast | |
trial_forecasts = filter( | |
lambda x: ( | |
string_in_extra_params in x.extra_parameters | |
) and ( | |
x.provider == user_info['organization'] | |
), | |
all_forecasts | |
) | |
return trial_forecasts | |
# go through each of our deterministic forecasts in the trial, | |
# generate random data, and upload to the API | |
for forecast_id in FORECAST_UUIDS: | |
forecast = session.get_forecast(forecast_id) | |
logging.info('Check if a forecast should be generated for %s', | |
forecast.name) | |
# set the run_time as now | |
run_time = pd.Timestamp.now(tz='UTC') | |
# From the forecast metadata, determine the next time | |
# the forecasts should be issued | |
issue_time = utils.get_next_issue_time( | |
forecast, run_time) | |
# if the next issue_time is not within 10 minutes of the | |
# current time, skip and move on to the next forecast | |
if (issue_time - run_time) > pd.Timedelta('10min'): | |
logging.info('Not yet time to generate forecast for %s. ' | |
'Next issue time is %s.', | |
forecast.name, issue_time) | |
continue | |
# Get the time range that we are expected to generate a | |
# forecast for. This includes an adjustment for the lead time | |
# before a forecast is valid. | |
start, end = utils.get_forecast_start_end(forecast, issue_time) | |
logging.info('Generating forecast for %s from %s to %s', | |
forecast.name, start, end) | |
# make the forecast, in this case just random numbers | |
# between 0 and 100 | |
# first, make the index ensuring closure is consistent with interval_label | |
if forecast.interval_label == 'ending': | |
index_closure = 'right' | |
else: | |
index_closure = 'left' | |
index = pd.date_range( | |
start=start, end=end, freq=forecast.interval_length, | |
closed=index_closure) | |
# now make the random series | |
forecast_series = pd.Series(np.random.randint(0, 100, len(index)), | |
index=index) | |
# upload the forecast to the API | |
# catch and log errors so we can try uplloading the other forecasts | |
try: | |
session.post_forecast_values(forecast.forecast_id, forecast_series) | |
except Exception: | |
logging.exception('Failed to upload forecast for %s', forecast.name) | |
continue | |
# Go through each probabilistic forecast group, get its metadata, | |
# and for each probabilistic constant value, generate and upload random data | |
for prob_forecast_id in PROBABILISTIC_FORECAST_UUIDS: | |
prob_forecast = session.get_probabilistic_forecast(prob_forecast_id) | |
logging.info( | |
'Check if a probabilistic forecast should be generated for %s', | |
prob_forecast.name) | |
run_time = pd.Timestamp.now(tz='UTC') | |
# From the forecast metadata, determine the next time | |
# the forecasts should be issued | |
issue_time = utils.get_next_issue_time( | |
prob_forecast, run_time) | |
# if the next issue_time is not within 10 minutes of the | |
# current time, skip and move on to the next forecast | |
if (issue_time - run_time) > pd.Timedelta('10min'): | |
logging.info('Not yet time to generate forecast for %s. ' | |
'Next issue time is %s.', | |
prob_forecast.name, issue_time) | |
continue | |
# Get the time range that we are expected to generate a | |
# forecast for. This includes an adjustment for the lead time | |
# before a forecast is valid. | |
start, end = utils.get_forecast_start_end(prob_forecast, issue_time) | |
logging.info('Generating forecast for %s from %s to %s', | |
prob_forecast.name, start, end) | |
# make an index that all prob. forecast constant values will share | |
# ensuring closure is consistent with interval_label | |
if prob_forecast.interval_label == 'ending': | |
index_closure = 'right' | |
else: | |
index_closure = 'left' | |
index = pd.date_range( | |
start=start, end=end, freq=prob_forecast.interval_length, | |
closed=index_closure) | |
# for each constant value, make a random timeseries and upload | |
# the timeseries for that constant value | |
for prob_constant_value in prob_forecast.constant_values: | |
# make the forecast, in this case just random numbers | |
# between 0 and 100 | |
forecast_series = pd.Series(np.random.randint(0, 100, len(index)), | |
index=index) | |
# upload the probalistic forecast constant value to the API | |
# catch and log errors so we can try uplloading the other forecasts | |
try: | |
session.post_probabilistic_forecast_constant_value_values( | |
prob_constant_value.forecast_id, forecast_series) | |
except Exception: | |
logging.exception( | |
'Failed to upload prob. forecast constant value for %s', | |
prob_constant_value.name) | |
continue |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment