Source code for herbie.latest

"""Herbie Helpers to get the latest model grid."""

import time

import pandas as pd

from herbie import Herbie, config


[docs] def HerbieLatest( model=config["default"].get("model"), priority=["aws", "nomads"], periods=4, **kwargs, ): r"""Find the latest model data. Parameters ---------- model : str The name of the model. priority : list The sources to look for data. The default value `["aws", "nomads"]` was chosen because it is a reasonable priority order for many of the models available from the NODD program (NOAA models like HRRR, GFS, GEFS, etc.) The data for these models will be made available on NOMADS first, but I also know AWS gets the data pretty quick. So, check AWS first, then check NOMADS (because if you make too many downloads from NOMADS your IP address will get blocked.) **kwargs Any other input you want passed to the Herbie class. """ if model.lower() in ["hrrr", "rap", "rrfs"]: freq = "1h" else: freq = "6h" # Create a list of recent dates to try dates = pd.date_range( pd.Timestamp.utcnow().floor(freq).tz_localize(None), periods=4, freq=f"-{freq}", ) # Find first existing Herbie object for date in dates: H = Herbie(date=date, model=model, priority=priority, **kwargs) if H.grib: return H raise TimeoutError(f"Herbie did not find data for the latest time: {H}")
[docs] def HerbieWait( model=config["default"].get("model"), priority=["aws", "nomads"], wait_for="5min", check_interval="15s", **kwargs, ): """Wait for the latest model grid to become available. Parameters ---------- model : str The name of the model. priority : list The sources to look for data. The default value `["aws", "nomads"]` was chosen because it is a reasonable priority order for many of the models available from the NODD program (NOAA models like HRRR, GFS, GEFS, etc.) The data for these models will be made available on NOMADS first, but I also know AWS gets the data pretty quick. So, check AWS first, then check NOMADS (because if you make too many downloads from NOMADS your IP address will get blocked.) wait_for : timedelta or Pandas-parsable Timedelta str Length of time Herbie will wait for data. check_every : int (seconds), timedelta, Pandas-parsable Timedelta str Frequency Herbie will look for data again, as a pandas-parsable timedelta string (e.g., '30s') or an int representing seconds. **kwargs Any other input you want passed to the Herbie class. """ now = pd.Timestamp.utcnow().floor("1h").tz_localize(None) if isinstance(check_interval, str): check_interval = pd.Timedelta(check_interval).total_seconds() timer = pd.Timestamp("now") H = Herbie(now, model=model, priority=priority, **kwargs) while H.grib is None: now = pd.Timestamp.utcnow().floor("1h").tz_localize(None) H = Herbie(now, model=model, priority=priority, **kwargs) if H.grib: return H time.sleep(check_interval) if (pd.Timestamp("now") - timer) >= pd.Timedelta(wait_for): break raise TimeoutError(f"Herbie did not find data in time: {H}")