HydrologicEngineeringCenter · Enovotny · Apr 20, 2026 · Apr 21, 2026 · Apr 21, 2026 · krowvin
@@ -41,8 +41,17 @@ def usgs_group():
     type=str,
     help='Backfill timeseries ids, use list of timeseries ids (e.g. "ts_id1, ts_id2") to attempt to backfill a subset of timeseries with USGS data',
 )
+@click.option(
+    "-bv",
+    "--backfill-version",
+    default=None,
+    type=str,
+    help='Backfill version, save data to a different version of the timeseries (e.g. "Rev-USGS" instead of "Raw-USGS")',
+)
 @requires(reqs.cwms, reqs.requests)
-def getusgs_timeseries(office, days_back, api_root, api_key, api_key_loc, backfill):
+def getusgs_timeseries(
+    office, days_back, api_root, api_key, api_key_loc, backfill, backfill_version
+):
     from cwmscli.usgs.getusgs_cda import getusgs_cda
 
     if backfill is not None:
@@ -57,6 +66,52 @@ def getusgs_timeseries(office, days_back, api_root, api_key, api_key_loc, backfi
         days_back=days_back,
         api_key=api_key,
         backfill_tsids=backfill_list,
+        backfill_version=backfill_version,
+    )
+
+
+@usgs_group.command(
+    "timeseries-v2",
+    help="Get USGS timeseries values using the new OGC API and store into CWMS database",
+)
+@office_option
+@days_back_option
+@api_root_option
+@api_key_option
+@api_key_loc_option
+@click.option(
+    "-b",
+    "--backfill",
+    default=None,
+    type=str,
+    help='Backfill timeseries ids, use list of timeseries ids (e.g. "ts_id1, ts_id2") to attempt to backfill a subset of timeseries with USGS data',
+)
+@click.option(
+    "-bv",
+    "--backfill-version",
+    default=None,
+    type=str,
+    help='Backfill version, save data to a different version of the timeseries (e.g. "Rev-USGS" instead of "Raw-USGS")',
+)
+@requires(reqs.cwms, reqs.requests)
+def getusgs_timeseries_v2(
+    office, days_back, api_root, api_key, api_key_loc, backfill, backfill_version
+):
+    from cwmscli.usgs.getusgs_cda import getusgs_cda_ogc
+
+    if backfill is not None:
+        backfill_list = [item.strip() for item in backfill.split(",") if item.strip()]
+    else:
+        backfill_list = None
+
+    api_key = get_api_key(api_key, api_key_loc)
+    getusgs_cda_ogc(
+        api_root=api_root,
+        office_id=office,
+        days_back=days_back,
+        api_key=api_key,
+        backfill_tsids=backfill_list,
+        backfill_version=backfill_version,
     )
 
 

@@ -46,6 +46,7 @@ def getusgs_cda(
     days_back: float,
     api_key: str,
     backfill_tsids: list = None,
+    backfill_version: str = None,
 ):
     api_key = "apikey " + api_key
     cwms.api.init_session(api_root=api_root, api_key=api_key)
@@ -60,6 +61,10 @@ def getusgs_cda(
     if backfill_tsids:
         USGS_ts = USGS_ts[USGS_ts["timeseries-id"].isin(backfill_tsids)]
 
+    USGS_ts = _validate_backfill_version_timeseries(
+        USGS_ts, backfill_version, office_id
+    )
+
     if len(USGS_ts) > 0:
         # grab all of the unique USGS stations numbers to be sent to USGS api
         sites = USGS_ts[USGS_ts["USGS_Method_TS"].isna()].USGS_St_Num.unique()
@@ -88,7 +93,9 @@ def getusgs_cda(
         if len(method_sites) > 0:
             USGS_data_method = getUSGS_ts(method_sites, startDT, endDT, 3)
 
-        CWMS_writeData(USGS_ts, USGS_data, USGS_data_method, days_back)
+        CWMS_writeData(
+            USGS_ts, USGS_data, USGS_data_method, days_back, backfill_version
+        )
     else:
         if backfill_tsids:
             _log_error_and_exit(
@@ -134,6 +141,9 @@ def get_USGS_params():
     return USGS_Params
 
 
+_USGS_PARAMS = get_USGS_params()
+
+
 def get_CMWS_TS_Loc_Data(office):
     """
     get time series group and location alias information and combine into singe dataframe
@@ -143,8 +153,8 @@ def get_CMWS_TS_Loc_Data(office):
     def find_usgsparam(attribute, param):
         if attribute > 0:
             usgs_param = str(attribute).split(".")[0]
-        elif param in USGS_Params.index:
-            usgs_param = USGS_Params.at[param, "USGS_PARAMETER"]
+        elif param in _USGS_PARAMS.index:
+            usgs_param = _USGS_PARAMS.at[param, "USGS_PARAMETER"]
         else:
             usgs_param = "Not Found"
         return usgs_param
@@ -236,7 +246,6 @@ def find_usgsparam(attribute, param):
             [USGS_ts[USGS_ts["USGS_St_Num"].notnull()], USGS_ts_base], axis=0
         )
 
-    USGS_Params = get_USGS_params()
     # this code fills in the USGS_Params field with values in the Time Series Group Attribute if it exists.  If it does not exist it
     # grabs the default USGS paramter for the coresponding CWMS parameter
     USGS_ts.attribute = USGS_ts.apply(
@@ -269,6 +278,7 @@ def getUSGS_ts(sites, startDT, endDT, access=None):
         # "modifiedSince": "PT6H",
         "siteStatus": "active",
     }
+    query_dict = {k: v for k, v in query_dict.items() if v is not None}
 
     r = requests.get(base_url, params=query_dict).json()
 
@@ -285,7 +295,63 @@ def getUSGS_ts(sites, startDT, endDT, access=None):
     return USGS_data
 
 
-def CWMS_writeData(USGS_ts, USGS_data, USGS_data_method, days_back):
+def _replace_ts_version(ts_id: str, backfill_version: str) -> str:
+    """Replace the version component of a timeseries ID.
+
+    The last dot-separated component is the version (e.g., Raw-USGS, Rev-USGS).
+    This function replaces it with the provided backfill_version.
+    """
+    parts = ts_id.rsplit(".", 1)
+    if len(parts) == 2:
+        return f"{parts[0]}.{backfill_version}"
+    return ts_id
+
+
+def _validate_backfill_version_timeseries(
+    usgs_ts: pd.DataFrame, backfill_version: str, office_id: str
+) -> pd.DataFrame:
+    """Validate that all timeseries with backfill_version exist in CWMS.
+
+    Returns dataframe with missing backfill_version timeseries removed.
+    """
+    if backfill_version is None:
+        return usgs_ts
+
+    try:
+        pattern = f".*\\.{backfill_version}$"
+        response = cwms.get_timeseries_identifiers(
+            office_id=office_id, timeseries_id_regex=pattern
+        )
+
+        existing_ts = set()
+        if response.df is not None and not response.df.empty:
+            existing_ts = set(response.df["timeseries-id"].values)
+
+        missing_ts = []
+        missing_original_ts = []
+        for ts_id in usgs_ts["timeseries-id"].unique():
+            new_ts_id = _replace_ts_version(ts_id, backfill_version)
+            if new_ts_id not in existing_ts:
+                missing_ts.append(new_ts_id)
+                missing_original_ts.append(ts_id)
+
+        if missing_ts:
+            logging.warning(
+                f"The following timeseries with backfill_version '{backfill_version}' do not exist in CWMS and will be skipped: {missing_ts}"
+            )
+            usgs_ts = usgs_ts[~usgs_ts["timeseries-id"].isin(missing_original_ts)]
+
+    except Exception as e:
+        logging.warning(
+            f"Could not verify timeseries with backfill_version for office {office_id}: {e}"
+        )
+
+    return usgs_ts
+
+
+def CWMS_writeData(
+    USGS_ts, USGS_data, USGS_data_method, days_back, backfill_version=None
+):
     # lists to hold time series that fail
     # noData -> usgs location and parameter were present in USGS api but the values were empty
     # NotinAPI -> usgs location and parameter were not retrieved from USGS api
@@ -371,10 +437,20 @@ def CWMS_writeData(USGS_ts, USGS_data, USGS_data_method, days_back):
                         office = row["office-id"]
                         values["quality-code"] = 0
 
+                        # apply backfill_version if provided
+                        store_ts_id = (
+                            _replace_ts_version(ts_id, backfill_version)
+                            if backfill_version
+                            else ts_id
+                        )
+
                         # write values to CWMS database
                         try:
                             data = cwms.timeseries_df_to_json(
-                                data=values, ts_id=ts_id, units=units, office_id=office
+                                data=values,
+                                ts_id=store_ts_id,
+                                units=units,
+                                office_id=office,
                             )
                             if days_back < 365:
                                 cwms.store_timeseries(data)
@@ -383,13 +459,13 @@ def CWMS_writeData(USGS_ts, USGS_data, USGS_data_method, days_back):
                                     data, max_workers=30, chunk_size=30 * 24 * 4
                                 )
                             logging.info(
-                                f"SUCCESS Data stored in CWMS database for -->  {ts_id},{USGS_Id_param}"
+                                f"SUCCESS Data stored in CWMS database for -->  {store_ts_id},{USGS_Id_param}"
                             )
                             saved = saved + 1
                         except Exception as error:
                             storErr.append([ts_id, USGS_Id_param, error])
                             logging.error(
-                                f"FAIL Data could not be stored to CWMS database for -->  {ts_id},{USGS_Id_param} CDA error = {error}"
+                                f"FAIL Data could not be stored to CWMS database for -->  {store_ts_id},{USGS_Id_param} CDA error = {error}"
                             )
             except Exception as error:
                 logging.error(
@@ -414,3 +490,83 @@ def CWMS_writeData(USGS_ts, USGS_data, USGS_data_method, days_back):
     logging.info(
         f"The following ts_ids errored because multiple method TSID were present for the USGS station. A USGS method TSID needs to be defined in the time series group in CWMS or an incorrect TSID is defined. {mult_ids}"
     )
+
+
+_OGC_BASE_URL = "https://api.waterdata.usgs.gov/ogcapi/v0/collections/continuous"
+
+
+def getUSGS_ts_ogc(sites, startDT, endDT, access=None):
+    """Fetch USGS instantaneous values from the OGC API endpoint.
+
+    Produces the same DataFrame structure as getUSGS_ts() so CWMS_writeData() works unchanged.
+
+    TODO: fill in OGC response parsing once sample JSON is available.
+    """
+    raise NotImplementedError(
+        "getUSGS_ts_ogc() is not yet implemented. "
+        "OGC API response parsing is pending. Use 'usgs timeseries' for the legacy endpoint."
+    )
+
+
+def getusgs_cda_ogc(
+    api_root: str,
+    office_id: str,
+    days_back: float,
+    api_key: str,
+    backfill_tsids: list = None,
+    backfill_version: str = None,
+):
+    """Fetch USGS time series data using the new OGC API and store into CWMS.
+
+    This is the OGC API variant of getusgs_cda(). The shared data fetching and writing
+    logic (get_CMWS_TS_Loc_Data, CWMS_writeData) is reused unchanged.
+    """
+    api_key = "apikey " + api_key
+    cwms.api.init_session(api_root=api_root, api_key=api_key)
+    logging.info(f"CDA connection: {api_root}")
+    logging.info(
+        f"Data will be grabbed and stored from USGS OGC API for past {days_back} days for office: {office_id}"
+    )
+    execution_date = datetime.now()
+
+    USGS_ts = get_CMWS_TS_Loc_Data(office_id)
+
+    if backfill_tsids:
+        USGS_ts = USGS_ts[USGS_ts["timeseries-id"].isin(backfill_tsids)]
+
+    USGS_ts = _validate_backfill_version_timeseries(
+        USGS_ts, backfill_version, office_id
+    )
+
+    if len(USGS_ts) > 0:
+        sites = USGS_ts[USGS_ts["USGS_Method_TS"].isna()].USGS_St_Num.unique()
+        method_sites = USGS_ts[USGS_ts["USGS_Method_TS"].notna()].USGS_St_Num.unique()
+        logging.info(f"Execution date {execution_date}")
+
+        tw_delta = -timedelta(days_back)
+        startDT = execution_date + tw_delta
+        endDT = execution_date + timedelta(hours=2)
+
+        logging.info(f"Grabbing data from USGS OGC API between {startDT} and {endDT}")
+
+        USGS_data = pd.DataFrame()
+        USGS_data_method = pd.DataFrame()
+
+        if len(sites) > 0:
+            USGS_data = getUSGS_ts_ogc(sites, startDT, endDT)
+        if len(method_sites) > 0:
+            USGS_data_method = getUSGS_ts_ogc(method_sites, startDT, endDT, 3)
+
+        CWMS_writeData(
+            USGS_ts, USGS_data, USGS_data_method, days_back, backfill_version
+        )
+    else:
+        if backfill_tsids:
+            _log_error_and_exit(
+                f"The following backfill time series ids were not present in the USGS time series or location alias groups: {backfill_tsids}"
+            )
+        else:
+            _log_error_and_exit(
+                f"No eligible USGS time series were found for office {office_id}.",
+                "Confirm that time series exist in Data Acquisition / USGS TS Data Acquisition and that matching entries exist in Agency Aliases / USGS Station Number.",
+            )