Abstract network update (#600)

* initial commit * updated Abstract and HyFeatures network objects to use new functions * bug fixes to get hyfeatures to run properly * updates to NHDNetwork and functions in AbstractNetwork * moved renaming param_df column into individual networks, removed cols from input argument for AbstractNetwork * move renaming dataframe columns and terminal codes/connections creation into read_geo_file function for HyFeatures * move functions from ..._preprocess.py files into the network objects as inherent functions * fixed errors in data_assimilation.update() function * t-route on larger hyfeature domain with hybrid routing (#602) * t-route on larger hyfeature domain with hybrid routing * remove debug line Co-authored-by: Dong Kim <[email protected]> * add 'RoutingScheme' subclass of AbstractNetwork to set MC/diffusive related variables * bug fixes to get test HYfeatures with MC only run working * move build_qlateral_array function from AbstractNetwork to individual networks * bug fixes to get NHDNetwork working with new configuration * modified routing classes to be separate from network classes * edited names of routing objects, consolidated inputs to nwm_route into fewer inputs * edits to diffusive routing * temporary fix for writing CHRTOUT files in serial rather than parallel * minor updates to previous push * Delete RoutingScheme.py * Delete nhd_preprocess.py * Delete hyfeature_preprocess.py * more updates to address comments above * deleted files * Fix troute-nwm package setup.cfg (#603) Make sure the setup.cfg knows how to properly find the actual package under the `src` dir. Otherwise, a standard install (`pip install troute-nwm/`) won't actually install the module source required (`-e` works/ed cause it just created a link to the src dir, but for actual packaging, it doesn't bundle the package code without this in the config. For reference, check out [this useful reference on src/ layouts](https://setuptools.pypa.io/en/latest/userguide/declarative_config.html#using-a-src-layout) * removed loading nhd_preprocess.py as this file was removed * reverse changes to compute_nhd_routing_v02 input arguments * edit to work with redesigned initial_warmstate_preprocess function * move build_forcing_sets() to AbstractNetwork. abstractnetwork_preprocess.py is no longer needed * Delete abstractnetwork_preprocess.py * initial commit * updated Abstract and HyFeatures network objects to use new functions * bug fixes to get hyfeatures to run properly * updates to NHDNetwork and functions in AbstractNetwork * moved renaming param_df column into individual networks, removed cols from input argument for AbstractNetwork * move renaming dataframe columns and terminal codes/connections creation into read_geo_file function for HyFeatures * move functions from ..._preprocess.py files into the network objects as inherent functions * fixed errors in data_assimilation.update() function * add 'RoutingScheme' subclass of AbstractNetwork to set MC/diffusive related variables * bug fixes to get test HYfeatures with MC only run working * move build_qlateral_array function from AbstractNetwork to individual networks * bug fixes to get NHDNetwork working with new configuration * modified routing classes to be separate from network classes * edited names of routing objects, consolidated inputs to nwm_route into fewer inputs * edits to diffusive routing * temporary fix for writing CHRTOUT files in serial rather than parallel * minor updates to previous push * Delete RoutingScheme.py * Delete nhd_preprocess.py * Delete hyfeature_preprocess.py * more updates to address comments above * removed loading nhd_preprocess.py as this file was removed * reverse changes to compute_nhd_routing_v02 input arguments * edit to work with redesigned initial_warmstate_preprocess function * move build_forcing_sets() to AbstractNetwork. abstractnetwork_preprocess.py is no longer needed --------- Co-authored-by: kumdonoaa <[email protected]> Co-authored-by: Dong Kim <[email protected]> Co-authored-by: Nels <[email protected]>
NOAA-OWP · Feb 16, 2023 · 01c713a · 01c713a
1 parent 4f13af1
commit 01c713a
Show file tree

Hide file tree

Showing 13 changed files with 1,852 additions and 2,446 deletions.
diff --git a/src/troute-network/troute/AbstractNetwork.py b/src/troute-network/troute/AbstractNetwork.py
diff --git a/src/troute-network/troute/AbstractRouting.py b/src/troute-network/troute/AbstractRouting.py
@@ -0,0 +1,323 @@
+from abc import ABC, abstractmethod
+import logging
+import yaml
+import json
+import xarray as xr
+import pandas as pd
+
+from troute.nhd_network import reverse_network
+from troute.nhd_network_utilities_v02 import organize_independent_networks, build_refac_connections
+
+LOG = logging.getLogger('')
+
+def read_diffusive_domain(domain_file):
+    '''
+    Read diffusive domain data from .ymal or .json file.
+    
+    Arguments
+    ---------
+    domain_file (str or pathlib.Path): Path of diffusive domain file
+    
+    Returns
+    -------
+    data (dict int: [int]): domain tailwater segments: list of segments in domain 
+                            (includeing tailwater segment) 
+    
+    '''
+    if domain_file[-4:] == "yaml":
+        with open(domain_file) as domain:
+            data = yaml.load(domain, Loader=yaml.SafeLoader)
+    else:
+        with open(domain_file) as domain:
+            data = json.load(domain)
+
+    return data
+
+def read_netcdf(geo_file_path):
+    '''
+    Open a netcdf file with xarray and convert to dataframe
+    
+    Arguments
+    ---------
+    geo_file_path (str or pathlib.Path): netCDF filepath
+    
+    Returns
+    -------
+    ds.to_dataframe() (DataFrame): netCDF contents
+    
+    Notes
+    -----
+    - When handling large volumes of netCDF files, xarray is not the most efficient.
+    
+    '''
+    with xr.open_dataset(geo_file_path) as ds:
+        return ds.to_dataframe()
+
+
+class AbstractRouting(ABC):
+    """
+    
+    """
+    __slots__ = ["hybrid_params", "_diffusive_domain", "_coastal_boundary_depth_df",
+                "_diffusive_network_data", "_topobathy_df", "_refactored_diffusive_domain",
+                "_refactored_diffusive_network_data", "_refactored_reaches", 
+                "_unrefactored_topobathy_df",]
+
+    def __init__(self):
+        """
+        
+        """
+        self._diffusive_domain                  = None
+        self._diffusive_network_data            = None
+        self._topobathy_df                      = pd.DataFrame()
+        self._unrefactored_topobathy_df         = pd.DataFrame() 
+        self._refactored_diffusive_domain       = None
+        self._refactored_diffusive_network_data = None   
+        self._refactored_reaches                = {}
+
+    @abstractmethod
+    def update_routing_domain(self, dataframe, connections):
+        pass
+
+    @property
+    @abstractmethod
+    def diffusive_network_data(self):
+        pass
+
+    @property
+    @abstractmethod
+    def topobathy_df(self):
+        pass
+
+    @property
+    @abstractmethod
+    def refactored_diffusive_domain(self):
+        pass
+
+    @property
+    @abstractmethod
+    def refactored_reaches(self):
+        pass
+
+    @property
+    @abstractmethod
+    def unrefactored_topobathy_df(self):
+        pass
+
+
+class MCOnly(AbstractRouting):
+
+    def __init__(self, _):
+        self.hybrid_params = None
+
+        super().__init__()
+
+    def update_routing_domain(self, dataframe, connections):
+        return dataframe, connections
+
+    @property
+    def diffusive_network_data(self):
+        return self._diffusive_network_data
+
+    @property
+    def topobathy_df(self):
+        return self._topobathy_df
+
+    @property
+    def refactored_diffusive_domain(self):
+        return self._refactored_diffusive_domain
+
+    @property
+    def refactored_reaches(self):
+        return self._refactored_reaches
+
+    @property
+    def unrefactored_topobathy_df(self):
+        return self._unrefactored_topobathy_df
+
+
+class MCwithDiffusive(AbstractRouting):
+
+    def __init__(self, hybrid_params):
+        self.hybrid_params = hybrid_params
+
+        super().__init__()
+
+    def update_routing_domain(self, dataframe, connections):
+        #==========================================================================
+        # build diffusive domain data and edit MC domain data for hybrid simulation
+        domain_file = self.hybrid_params.get("diffusive_domain", None)
+        self._diffusive_domain = read_diffusive_domain(domain_file)
+        self._diffusive_network_data = {}
+
+        rconn_diff0 = reverse_network(connections)
+
+        for tw in self._diffusive_domain:
+            mainstem_segs = self._diffusive_domain[tw]['links']
+            # we want mainstem_segs start at a mainstem link right after the upstream boundary mainstem link, which is
+            # in turn not under any waterbody. This boundary mainstem link should be turned into a tributary segment.
+            upstream_boundary_mainstem_link = self._diffusive_domain[tw]['upstream_boundary_link_mainstem']         
+            if upstream_boundary_mainstem_link[0] in mainstem_segs:
+                mainstem_segs.remove(upstream_boundary_mainstem_link[0])
+
+            # ===== build diffusive network data objects ==== 
+            self._diffusive_network_data[tw] = {}
+
+            # add diffusive domain segments
+            self._diffusive_network_data[tw]['mainstem_segs'] =  mainstem_segs
+
+            # diffusive domain tributary segments
+            trib_segs = []
+
+            for seg in mainstem_segs:
+                us_list = rconn_diff0[seg]
+                for u in us_list:
+                    if u not in mainstem_segs:
+                        trib_segs.append(u) 
+
+            self._diffusive_network_data[tw]['tributary_segments'] = trib_segs
+            # diffusive domain connections object
+            self._diffusive_network_data[tw]['connections'] = {k: connections[k] for k in (mainstem_segs + trib_segs)}       
+
+            # make sure that no downstream link below tw
+            self._diffusive_network_data[tw]['connections'][tw] = []
+
+            # diffusive domain reaches and upstream connections. 
+            # break network at tributary segments
+            _, reaches, rconn_diff = organize_independent_networks(
+                self._diffusive_network_data[tw]['connections'],
+                set(trib_segs),
+                set(),
+            )
+
+            self._diffusive_network_data[tw]['rconn'] = rconn_diff
+            self._diffusive_network_data[tw]['reaches'] = reaches[tw]
+
+            # RouteLink parameters
+            self._diffusive_network_data[tw]['param_df'] = dataframe.filter(
+                (mainstem_segs + trib_segs),
+                axis = 0,
+            )
+            self._diffusive_network_data[tw]['upstream_boundary_link'] = upstream_boundary_mainstem_link
+
+            # ==== remove diffusive domain segs from MC domain ====        
+            # drop indices from param_df
+            dataframe = dataframe.drop(mainstem_segs)
+
+            # remove keys from connections dictionary
+            for s in mainstem_segs:
+                connections.pop(s)
+
+            # update downstream connections of trib segs
+            for us in trib_segs:
+                connections[us] = []
+
+        return dataframe, connections
+
+    @property
+    def diffusive_network_data(self):
+        return self._diffusive_network_data
+
+    @property
+    def topobathy_df(self):
+        return self._topobathy_df
+
+    @property
+    def refactored_diffusive_domain(self):
+        return self._refactored_diffusive_domain
+
+    @property
+    def refactored_reaches(self):
+        return self._refactored_reaches
+
+    @property
+    def unrefactored_topobathy_df(self):
+        return self._unrefactored_topobathy_df
+
+
+class MCwithDiffusiveNatlXSectionNonRefactored(MCwithDiffusive):
+
+    def __init__(self, hybrid_params):
+
+        super().__init__(hybrid_params = hybrid_params)
+
+    @property
+    def topobathy_df(self):
+        if self._topobathy_df.empty:
+            topobathy_file = self.hybrid_params.get("topobathy_domain", None)
+            self._topobathy_df = read_netcdf(topobathy_file).set_index('link')
+            self._topobathy_df.index = self._topobathy_df.index.astype(int)
+        return self._topobathy_df
+
+
+class MCwithDiffusiveNatlXSectionRefactored(MCwithDiffusive):
+
+    def __init__(self, hybrid_params):
+
+        super().__init__(hybrid_params = hybrid_params)
+
+    @property
+    def topobathy_df(self):
+        if self._topobathy_df.empty:
+            refactored_topobathy_file = self.hybrid_params.get("refactored_topobathy_domain", None)
+            self._topobathy_df = read_netcdf(refactored_topobathy_file).set_index('link')
+        return self._topobathy_df
+
+    @property
+    def refactored_diffusive_domain(self):
+        if not self._refactored_diffusive_domain:
+            refactored_domain_file = self.hybrid_params.get("refactored_domain", None)
+            self._refactored_diffusive_domain = read_diffusive_domain(refactored_domain_file)
+        return self._refactored_diffusive_domain
+
+    @property
+    def refactored_reaches(self):
+        if not self._refactored_reaches:
+            refactored_topobathy_file = self.hybrid_params.get("refactored_topobathy_domain", None)
+            diffusive_parameters = {'geo_file_path': refactored_topobathy_file}
+            refactored_connections = build_refac_connections(diffusive_parameters)
+
+            for tw in self._diffusive_domain:
+
+                # list of stream segments of a single refactored diffusive domain 
+                refac_tw = self.refactored_diffusive_domain[tw]['refac_tw']
+                rlinks_tw = self.refactored_diffusive_domain[tw]['rlinks']
+                refactored_connections_tw = {}   
+
+                # Subset a connection dictionary (upstream segment as key : downstream segments as values) from refactored_connections
+                # for a single refactored diffusive domain defined by a current tw. 
+                for k in rlinks_tw:
+                    if k in refactored_connections.keys() and k != refac_tw:
+                        refactored_connections_tw[k] = refactored_connections[k]
+
+                trib_segs = self.diffusive_network_data[tw]['tributary_segments']
+                refactored_diffusive_network_data = {}
+                refactored_diffusive_network_data[refac_tw] = {}                
+                refactored_diffusive_network_data[refac_tw]['tributary_segments'] = trib_segs
+                refactored_diffusive_network_data[refac_tw]['connections'] = refactored_connections_tw                 
+
+                for k in trib_segs:
+                    refactored_diffusive_network_data[refac_tw]['connections'][k] = [self._refactored_diffusive_domain[tw]['incoming_tribs'][k]]
+
+                # diffusive domain reaches and upstream connections. 
+                # break network at tributary segments
+                _, refactored_reaches_batch, refactored_conn_diff = organize_independent_networks(
+                                                            refactored_diffusive_network_data[refac_tw]['connections'],
+                                                            set(trib_segs),
+                                                            set(),
+                                                            )
+
+                self._refactored_reaches[refac_tw] = refactored_reaches_batch[refac_tw]
+                refactored_diffusive_network_data[refac_tw]['mainstem_segs'] = self._refactored_diffusive_domain[tw]['rlinks']
+                refactored_diffusive_network_data[refac_tw]['upstream_boundary_link'] = self._diffusive_network_data[tw]['upstream_boundary_link']
+        return self._refactored_reaches
+
+    @property
+    def unrefactored_topobathy_df(self):
+        if self._unrefactored_topobathy_df.empty:
+            topobathy_file = self.hybrid_params.get("topobathy_domain",   None)
+            self._unrefactored_topobathy_df = read_netcdf(topobathy_file).set_index('link')
+            self._unrefactored_topobathy_df.index = self._unrefactored_topobathy_df.index.astype(int)
+        return self._unrefactored_topobathy_df
+
+