<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="research-article">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">HESS</journal-id><journal-title-group>
    <journal-title>Hydrology and Earth System Sciences</journal-title>
    <abbrev-journal-title abbrev-type="publisher">HESS</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Hydrol. Earth Syst. Sci.</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1607-7938</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/hess-30-3425-2026</article-id><title-group><article-title>Symbolic regression-based regionalization of baseflow separation parameter using catchment-scale characteristics</article-title><alt-title>Symbolic regression-based regionalization of baseflow separation parameter</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff3">
          <name><surname>Lin</surname><given-names>Yongen</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="yes" rid="aff1 aff2 aff3">
          <name><surname>Wang</surname><given-names>Dagang</given-names></name>
          <email>wangdag@mail.sysu.edu.cn</email>
        <ext-link>https://orcid.org/0000-0002-6424-6398</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Mei</surname><given-names>Yiwen</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-3326-8287</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff3">
          <name><surname>Zhu</surname><given-names>Jinxin</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-3248-7410</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5">
          <name><surname>Wu</surname><given-names>Huan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff6">
          <name><surname>Wang</surname><given-names>Shuo</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-7827-187X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff7">
          <name><surname>Xu</surname><given-names>Zhonghou</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" deceased="yes" corresp="no" rid="aff8">
          <name><surname>Shamseldin</surname><given-names>Asaad Y.</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff9">
          <name><surname>Anagnostou</surname><given-names>Emmanouil N.</given-names></name>
          
        </contrib>
        <aff id="aff1"><label>1</label><institution>School of Geography and Planning, Sun Yat-sen University, Guangzhou, China</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>Guangdong Key Laboratory for Urbanization and Geo-simulation, Sun Yat-sen University, Guangzhou, China</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>Carbon-Water Research Station in Karst Regions of Northern Guangdong, Sun Yat-sen University, Guangzhou, China</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>School of Atmospheric Science, Sun Yat-sen University, Zhuhai, Guangdong, China</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>State Key Laboratory of Climate System Prediction and Risk Management, Nanjing University of Information Science and Technology, Nanjing, China</institution>
        </aff>
        <aff id="aff6"><label>6</label><institution>Department of Land Surveying and Geo-informatics, Hong Kong Polytechnic University, Kowloon, Hong Kong Special Administrative Region, China</institution>
        </aff>
        <aff id="aff7"><label>7</label><institution>Earth Sciences New Zealand, Hamilton 3216, New Zealand</institution>
        </aff>
        <aff id="aff8"><label>8</label><institution>Department of Civil and Environmental Engineering, The University of Auckland, Auckland 1010, New Zealand</institution>
        </aff>
        <aff id="aff9"><label>9</label><institution>Department of Civil and Environmental Engineering, University of Connecticut, Storrs, USA</institution>
        </aff><author-comment content-type="deceased"><p/></author-comment>
      </contrib-group>
      <author-notes><corresp id="corr1">Dagang Wang (wangdag@mail.sysu.edu.cn)</corresp></author-notes><pub-date><day>3</day><month>June</month><year>2026</year></pub-date>
      
      <volume>30</volume>
      <issue>11</issue>
      <fpage>3425</fpage><lpage>3438</lpage>
      <history>
        <date date-type="received"><day>3</day><month>December</month><year>2025</year></date>
           <date date-type="rev-request"><day>12</day><month>December</month><year>2025</year></date>
           <date date-type="rev-recd"><day>17</day><month>May</month><year>2026</year></date>
           <date date-type="accepted"><day>18</day><month>May</month><year>2026</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 Yongen Lin et al.</copyright-statement>
        <copyright-year>2026</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026.html">This article is available from https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026.html</self-uri><self-uri xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026.pdf">The full text article is available as a PDF file from https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e214">Accurate separation of baseflow from streamflow is of utmost importance for understanding catchment hydrological processes and supporting effective water resource management. The Smooth Minima Method is a common baseflow separation technique with a segment length parameter (<inline-formula><mml:math id="M1" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>) representing the catchment average flow event duration. <inline-formula><mml:math id="M2" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> is usually predicted by a power function with catchment area or defaults to 5 d. Yet these estimations are insufficient given the multivariate nature of <inline-formula><mml:math id="M3" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> with other catchment attributes. In this study, we employ symbolic regression (SR) to search for possible formulation of <inline-formula><mml:math id="M4" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> with a range of catchment attributes based on 855 catchments across the Contiguous United States. We ultimately identify three mathematical expressions of increasing complexity, achieving <inline-formula><mml:math id="M5" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> values of 0.48, 0.52, and 0.55, compared to 0.23 and <inline-formula><mml:math id="M6" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>0.84 for the power function and constant values. The three expressions reveal that <inline-formula><mml:math id="M7" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> increases following a power-law relationship with catchment area (<inline-formula><mml:math id="M8" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>) and catchment-averaged soil saturated hydraulic conductivity (<inline-formula><mml:math id="M9" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) with decreasing rates, while it increases linearly with snow day fraction (<inline-formula><mml:math id="M10" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>). The effects of <inline-formula><mml:math id="M11" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M12" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> on <inline-formula><mml:math id="M13" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> are particularly pronounced for larger values (<inline-formula><mml:math id="M14" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&gt;</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">25</mml:mn></mml:mrow></mml:math></inline-formula> mm h<sup>−1</sup> and <inline-formula><mml:math id="M16" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&gt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">0.4</mml:mn></mml:mrow></mml:math></inline-formula>) and smaller area (<inline-formula><mml:math id="M17" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&lt;</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula> km<sup>2</sup>). The different calculations of <inline-formula><mml:math id="M19" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> are also evaluated in baseflow separation, revealing higher medians of Kling-Gupta Efficiency of at least 0.84, outperforming the literature-suggested formulas for a maximum increment of 0.22. This study highlights the potential of SR for uncovering physically meaningful formulas in optimal baseflow separation.</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>National Natural Science Foundation of China</funding-source>
<award-id>52579030</award-id>
</award-group>
<award-group id="gs2">
<funding-source>Natural Science Foundation of Guangdong Province</funding-source>
<award-id>2025A1515011666</award-id>
<award-id>2025A1515012264</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e416">Baseflow is an essential component of streamflow, primarily originating from groundwater, deep interflow, snow melting, and other delayed sources (Xie et al., 2020; Wang et al., 2022; Stoelzle et al., 2020). The proportion of baseflow in streamflow reflects the complex interactions between surface water and groundwater systems (Pelletier and Andréassian, 2020; Xie et al., 2024), and understanding this proportion can aid in water resources management and riverine ecosystem conservation  (Yan et al., 2023; Tan et al., 2020). Baseflow is difficult to measure directly and it is usually estimated using baseflow separation methods  (Humphrey et al., 2022; Stewart, 2015), which take continuous streamflow data as the only inputs. The performance of baseflow separation is sensitive to parameters of the separation methods, which, if not optimized, may lead to unrealistic baseflow dynamics  (Mei et al., 2024b). Incorporating environmental tracer data for parameter optimization is a common practice, as it ensures reliable baseflow separation by maintaining dual mass balance for both tracer concentration and streamflow volume  (Cartwright, 2022; Hagedorn, 2020; McMahon and Nathan, 2021). Commonly used tracers include specific electrical conductivity (SEC), turbidity, and stable isotopes, among which SEC is the most widely applied due to its routine availability in many monitoring programs  (Mei et al., 2024b). However, a critical challenge arises as this method is not applicable for catchments without continuous tracer data, which unfortunately constitutes the majority of gaged catchments worldwide (Thorslund and van Vliet, 2020; Hou et al., 2024). This limitation hinders accurate quantification of baseflow in most global catchments, despite their long-term streamflow data.</p>
      <p id="d2e419">To optimize baseflow separation for gaged catchments lacking continuous environmental tracer data, a viable approach is to transfer optimized parameters from other catchments (Klotz et al., 2017; Feigl et al., 2020). Specifically, prediction models can be developed for these optimized parameters based on factors representing catchment physical conditions. This approach is fundamentally rooted in the hydrological similarity theory, which assumes that baseflow parameters reflect the catchment's hydrological signatures and relate to its physical characteristics  (Zhang et al., 2020; Gnann et al., 2021; McMillan et al., 2022; Price, 2011). While this parameter regionalization approach is widely used for transferring calibrated parameters to un-gaged catchments in hydrological modeling (Klotz et al., 2017; Feigl et al., 2020), its application in the context of baseflow parameters is unexplored. The smooth minima method (SMM) is a widely used method for baseflow separation, with a segment length parameter (<inline-formula><mml:math id="M20" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>) representing the average streamflow delay and catchment response (Stoelzle et al., 2020). This parameter is often defaulted to 5 d or estimated by an empirical power-law relationship with drainage area (<inline-formula><mml:math id="M21" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>) as <inline-formula><mml:math id="M22" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.6</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>  (Aksoy et al., 2008). However, Lin et al. (2026) found that while <inline-formula><mml:math id="M23" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> is the most influential predictor, incorporating additional factors representing geomorphology, climate, soil hydraulics properties, and human activities into the nonparametric random forest (RF) model yielded more accurate estimates than the power function. This highlights the complex interactions between streamflow delay and the diverse catchment characteristics (Price, 2011; Stoelzle et al., 2020).</p>
      <p id="d2e462">Despite higher prediction accuracy, the RF-based regionalization model does not provide an explicit analytical expression linking catchment attributes to parameter <inline-formula><mml:math id="M24" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>  (Rudin, 2019). Although tree-based models can be interpreted using post-hoc tools such as SHAP values and partial dependence plots, they provide only approximate, model-dependent interpretations rather than explicit functional relationships (Rudin, 2019; Makke and Chawla, 2024). Moreover, they typically describe average effects while overlooking higher-order interactions and may be sensitive to feature correlation, potentially leading to unstable or misleading explanations (Apley and Zhu, 2020; Sundararajan and Najmi, 2020). To develop interpretable regionalization models with structural transparency for the optimal baseflow parameters <inline-formula><mml:math id="M25" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>, this study employs an emerging machine learning technique called symbolic regression (SR), which focuses on data-driven identification of explicit mathematical expressions to describe relationships between predictors and target variable (Koza, 1994; Song et al., 2024). In recent years, SR has been increasingly applied in hydrology to uncover governing relationships in complex environmental systems, owing to its ability to balance predictive performance and interpretability (Chadalawada et al., 2020; Sheta et al., 2023). One example is the use of SR to extract explicit functional relationships between catchment attributes and hydrological model parameters for ungaged catchments (Li et al., 2024; Feigl et al., 2022). Unlike a “black-box” model such as RF, SR derives explicit and concise equations that identify underlying data patterns, while mitigating overfitting through complexity control (Kronberger et al., 2022; Wilstrup and Kasak, 2021). This structural transparency enables direct interpretation of how catchment attributes govern baseflow parameter values, which in terms influence the partitioning of streamflow (Klotz et al., 2017; Feigl et al., 2020; Sheta et al., 2023).</p>
      <p id="d2e479">To evaluate the effectiveness for regionalization of baseflow parameters, this study applies SR to model the segment length parameter of SMM and addresses three objectives: (a) assess the complexity-performance trade-off of SR-derived formulas for <inline-formula><mml:math id="M26" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>; (b) explore the functional relationships between <inline-formula><mml:math id="M27" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> and catchment attributes in the SR formulas; and (c) evaluate the different <inline-formula><mml:math id="M28" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s calculated by SR in baseflow separation. This study should not be viewed as an effort to assert a superior utility of SR over other machine learning models in the regionalization of baseflow parameters. Instead, the SR formulas serve as post-hoc interpretability tools to complement other black box models, enhancing the transparency of the underlying relationship between hydrological signatures and catchment attributes (Rudin, 2019).</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Study catchments and data</title>
      <p id="d2e511">This study used the baseflow dataset produced by  Mei et al. (2024a), which contains the segment length parameter of SMM optimized by SEC for 987 catchments across the Conterminous United States (CONUS). To ensure the reliability of baseflow separation using the SMM method, catchments exhibiting suboptimal baseflow separation performance with a Kling Gupta Efficiency between estimated and observed SEC below 0.5 were excluded (Mei et al., 2024a). Additionally, catchments with incomplete attribute data (see the next paragraph for details) were also eliminated. After applying these criteria, a total of 855 catchments remained. The spatial distribution of these catchments, overlaid with drainage area, mean streamflow, and baseflow index (BFI), is depicted in Fig. 1a–c, showing significant diversity. The optimal <inline-formula><mml:math id="M29" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> parameters for these catchments are depicted in Fig. 1d with most values smaller than 17 d. Larger <inline-formula><mml:math id="M30" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> values tend to occur in mountainous regions characterized by drier climates and greater snow persistence with implicit spatial patterns, which may be attributed to the multifactor controls of <inline-formula><mml:math id="M31" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>  (Lin et al., 2026). The level 2 and level 4 Hydrological Unit Codes (HUC2 and HUC4), which represent large and sub-regional hydrologic basins in the United States, are provided for better referencing the spatial distributions of results in the analysis (Fig. 1e, f).</p>

      <fig id="F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e537">Spatial distribution of the 855 selected catchments with their drainage area <bold>(a)</bold>, mean streamflow <bold>(b)</bold>, BFI <bold>(c)</bold>, and optimal segment length parameter <inline-formula><mml:math id="M32" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> <bold>(d)</bold> superimposed on HUC2 regions. The HUC2 and HUC4 region maps are provided for referencing <bold>(e, f)</bold>.</p></caption>
        <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f01.png"/>

      </fig>

      <p id="d2e569">Lin et al. (2026) identified 13 catchment characteristics representing the geomorphology, climate, soil hydraulic properties, and water usage, that significantly influence the SMM parameter <inline-formula><mml:math id="M33" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> (Table 1, rows 1–13). In addition to these predictors, we added two more related to snow processes and vegetation dynamics (Table 1, rows 14–15), as previous studies have shown that these factors can substantially affect baseflow generation (Price, 2011; Stoelzle et al., 2020; Xie et al., 2022). The data of these 15 variables are all obtained from Lin et al. (2025). To reduce the dimensionality of the predictor space, we examined the mutual information (MI) between candidate predictors. Variable pairs exhibiting MI values greater than 0.5 were considered to contain substantial shared information (Fig. S1 in the Supplement). In such cases, only one representative variable was retained to prevent redundant contributions in training the symbolic regression models. After this screening step, the number of predictors was reduced to nine (highlighted in blue in Table 1), which were then used as inputs for the SR analysis.</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e583">Catchment characteristics used as inputs to the SR method for predicting parameter <inline-formula><mml:math id="M34" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. Catchment characteristics marked with an asterisk are selected for the development of SR based on the mutual information approach.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="3">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Name</oasis:entry>
         <oasis:entry colname="col3">Description (unit)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">1</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M35" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi mathvariant="normal">PE</mml:mi><mml:mi>x</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Maximum daily potential evapotranspiration (mm d<sup>−1</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">2</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M37" display="inline"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>X</mml:mi><mml:mi>x</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Maximum daily maximum temperature (<sup>∘</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">3</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M39" display="inline"><mml:mrow><mml:msub><mml:mi>P</mml:mi><mml:mn mathvariant="normal">95</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">The 95th percentile of daily precipitation larger than 0.01 mm (mm d<sup>−1</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">4</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M41" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi>P</mml:mi><mml:mn mathvariant="normal">50</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Median of daily precipitation larger than 0.01 mm (mm d<sup>−1</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">5</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M43" display="inline"><mml:mrow><mml:msub><mml:mi>P</mml:mi><mml:mn mathvariant="normal">5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">The 5th percentile of daily precipitation larger than 0.01 mm (mm d<sup>−1</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">6</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M45" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Proportion of days with precipitation larger than 0.01 mm (–)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">7</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M46" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">cly</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Volumetric fraction of clay (–)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">8</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M47" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi>W</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Saturated water capacity (%)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">9</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M48" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Saturated hydraulic conductivity (mm h<sup>−1</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">10</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M50" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:mi>A</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Catchment area (km<sup>2</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">11</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M52" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">E</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Elongation ratio (-)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">12</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M53" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:mover accent="true"><mml:mi>S</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Mean daily storage of reservoirs (<inline-formula><mml:math id="M54" display="inline"><mml:mrow><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mn mathvariant="normal">6</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> m<sup>3</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">13</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M56" display="inline"><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi mathvariant="normal">SD</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Standard deviation of daily storage of reservoirs (<inline-formula><mml:math id="M57" display="inline"><mml:mrow><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mn mathvariant="normal">6</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> m<sup>3</sup>)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">14</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M59" display="inline"><mml:mrow><mml:msup><mml:mi/><mml:mo>*</mml:mo></mml:msup><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Proportion of days with snow water equivalent larger than 0.05 mm (–)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">15</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M60" display="inline"><mml:mover accent="true"><mml:mi mathvariant="normal">LAI</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Mean 16-daily leaf area index (–)</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Methods</title>
<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Smooth Minima Baseflow Separation</title>
      <p id="d2e1109">SMM is a widely used baseflow separation method (Aksoy et al., 2008; Piggott et al., 2005; Xie et al., 2020; Tan et al., 2020). It assumes that total streamflow is partitioned into baseflow and event-flow components and baseflow constitutes 100 % of streamflow during low-flow periods (Gustard et al., 1992). The SMM procedure involves partitioning daily streamflow into non-overlapping <inline-formula><mml:math id="M61" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>-day intervals and identifying the minimum value within each segment. These minimum points (<inline-formula><mml:math id="M62" display="inline"><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M63" display="inline"><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M64" display="inline"><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, …) are then screened using a filtering coefficient (<inline-formula><mml:math id="M65" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula>): a point is discarded if  <inline-formula><mml:math id="M66" display="inline"><mml:mrow><mml:mi>M</mml:mi><mml:mo>⋅</mml:mo><mml:msub><mml:mi>Q</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> exceeds the value of either adjacent minimum. Finally, the baseflow series is constructed by linearly interpolating the remaining minima. The method involves two key parameters: the segment length parameter (<inline-formula><mml:math id="M67" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>) and the filtering coefficient parameter (<inline-formula><mml:math id="M68" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula>). The segment length parameter <inline-formula><mml:math id="M69" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> is a proxy of the flow event duration  (Stoelzle et al., 2020). Generally, a smaller <inline-formula><mml:math id="M70" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> results in a higher proportion of baseflow in streamflow, implying shorter surface flow duration. In the literature, <inline-formula><mml:math id="M71" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> often defaults to 5 d or is predicted using a power-law relationship with catchment area, namely <inline-formula><mml:math id="M72" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.6</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M73" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> is the catchment area in km<sup>2</sup> and <inline-formula><mml:math id="M75" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> is expressed in days (Zhang et al., 2017; Aksoy et al., 2008). These two formulations of <inline-formula><mml:math id="M76" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> are included in the comparison and are denoted as <inline-formula><mml:math id="M77" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M78" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, respectively. To further examine the explanatory capacity of the areal-based power-law relationship, we considered a calibrated form of <inline-formula><mml:math id="M79" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mi>a</mml:mi><mml:mo>⋅</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mi>b</mml:mi></mml:msup></mml:mrow></mml:math></inline-formula> (denoted as <inline-formula><mml:math id="M80" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>), where the coefficients <inline-formula><mml:math id="M81" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M82" display="inline"><mml:mi>b</mml:mi></mml:math></inline-formula> are estimated from the data by minimizing the squared error between the reference and predicted <inline-formula><mml:math id="M83" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s.</p>
      <p id="d2e1336">The filtering coefficient parameter <inline-formula><mml:math id="M84" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula> is used to determine if a streamflow minimum qualifies as a strict baseflow point. Higher values of <inline-formula><mml:math id="M85" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula> (typically not exceeding 1) correspond to more stringent criteria for identifying pure baseflow conditions. Unlike <inline-formula><mml:math id="M86" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>, the parameter <inline-formula><mml:math id="M87" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula> is less sensitive to the baseflow separation results and is commonly assigned a constant value of 0.9 (Stoelzle et al., 2020; Aksoy et al., 2008).</p>
</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Symbolic regression modelling for the segment length parameter</title>
      <p id="d2e1375">Symbolic regression (SR) is employed to derive expressions for the parameter <inline-formula><mml:math id="M88" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. SR represents an expression using a tree structure, where each node corresponds to a mathematical operator, and each leaf represents an input variable or constant. Structure of the tree evolves to identify expressions that best fit the inputted data through genetic programming  (Koza, 1994). Five sample SR trees were demonstrated within the dotted box in Fig. 2a. In this study, the SR method is implemented using the PySR library in Python (Cranmer, 2023), which enforces syntactically valid mathematical structures through predefined operator sets and expression tree representations. The nine representative catchment attributes in original units (Table 1) were used as predictors without normalization to maintain interpretability for the SR expressions. The function space consists of the catchment attributes, free constants, and a set of mathematical operators: addition (<inline-formula><mml:math id="M89" display="inline"><mml:mo lspace="0mm">+</mml:mo></mml:math></inline-formula>), subtraction (<inline-formula><mml:math id="M90" display="inline"><mml:mo lspace="0mm">-</mml:mo></mml:math></inline-formula>), multiplication (<inline-formula><mml:math id="M91" display="inline"><mml:mo lspace="0mm">×</mml:mo></mml:math></inline-formula>), division (<inline-formula><mml:math id="M92" display="inline"><mml:mo lspace="0mm">/</mml:mo></mml:math></inline-formula>), power-law (power), and logarithm (log).</p>

      <fig id="F2" specific-use="star"><label>Figure 2</label><caption><p id="d2e1415">Flowchart of the SR-based prediction framework for the parameter <inline-formula><mml:math id="M93" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> of SMM <bold>(a)</bold> and the three performance evaluation strategies <bold>(b)</bold>.</p></caption>
          <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f02.png"/>

        </fig>

      <p id="d2e1437">To control the search space and ensure physically interpretable expressions, several structural constraints were imposed in SR model training. Multiplication, division, power-law, and logarithmic operators were not allowed to be nested within operators of the same type. The internal complexity of expressions inside power-law and logarithmic operators was restricted to a maximum value of 3. The maximum allowable total complexity was set to 20. Expression complexity is defined as the sum of the complexity index assigned to each component in the equation. Take <inline-formula><mml:math id="M94" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.6</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> as an example, if multiplication and power-law operators are each assigned a complexity of 2 and constants and input variables are assigned a complexity of 1, the total complexity of the expression is calculated as <inline-formula><mml:math id="M95" display="inline"><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>=</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula>. In this study, all operators were assigned a uniform complexity index of 1 to avoid bias toward specific functional forms. Recursive formulations (i.e., expressions where the output variable appears as an input to itself) were not permitted to ensure model interpretability and avoid trivial or ill-posed solutions.</p>
      <p id="d2e1488">The SR search process was configured with the following hyperparameters: a population size of 33, populations of 15, the crossover rate of 0.066, and evolved over 40 generations. The goodness of fit between the reference and the predicted <inline-formula><mml:math id="M96" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s is evaluated using the mean squared error (MSE):

            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M97" display="block"><mml:mrow><mml:mi mathvariant="normal">MSE</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>C</mml:mi></mml:mfrac></mml:mstyle><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>C</mml:mi></mml:munderover><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>

          where <inline-formula><mml:math id="M98" display="inline"><mml:mi>C</mml:mi></mml:math></inline-formula> is the total number of catchments, and <inline-formula><mml:math id="M99" display="inline"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M100" display="inline"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> represent the reference and predicted values of <inline-formula><mml:math id="M101" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> for catchment <inline-formula><mml:math id="M102" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>, respectively. To evaluate the robustness of the SR models, a ten-fold cross-validation strategy is employed (Fig. 2a). The 855 catchments are randomly partitioned into ten subsets of approximately equal size. In each iteration, the model is trained on nine subsets and tested on the remaining one to estimate the generalization error. This process is repeated ten times so that each subset serves once as the testing set. In each iteration, 7 to 10 expressions with varying levels of complexity are generated, resulting in a total of 91 expressions. Among these expressions, we identified recurrent equation forms across all ten iterations.</p>
</sec>
<sec id="Ch1.S3.SS3">
  <label>3.3</label><title>Evaluation strategies</title>
      <p id="d2e1603">Three strategies are employed to evaluate the performance of different <inline-formula><mml:math id="M103" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s calculated by the SR formulas (Fig. 2b). The first strategy compares the predicted and reference <inline-formula><mml:math id="M104" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s using the mean bias (<inline-formula><mml:math id="M105" display="inline"><mml:mi>B</mml:mi></mml:math></inline-formula>) and coefficient of determination (<inline-formula><mml:math id="M106" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>):

                <disp-formula specific-use="gather" content-type="numbered"><mml:math id="M107" display="block"><mml:mtable displaystyle="true"><mml:mlabeledtr id="Ch1.E2"><mml:mtd><mml:mtext>2</mml:mtext></mml:mtd><mml:mtd><mml:mrow><mml:mstyle displaystyle="true" class="stylechange"/><mml:mi>B</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>C</mml:mi></mml:mfrac></mml:mstyle><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>C</mml:mi></mml:msubsup><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo mathvariant="normal" stretchy="false">^</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr><mml:mlabeledtr id="Ch1.E3"><mml:mtd><mml:mtext>3</mml:mtext></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>C</mml:mi></mml:msubsup><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover><mml:mi>r</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>-</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>C</mml:mi></mml:msubsup><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo mathvariant="normal" stretchy="false">^</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>C</mml:mi></mml:msubsup><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover><mml:mi>r</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr></mml:mtable></mml:math></disp-formula>

          where <inline-formula><mml:math id="M108" display="inline"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>N</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover><mml:mi>r</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="false"><mml:mfrac style="text"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>C</mml:mi></mml:mfrac></mml:mstyle><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>C</mml:mi></mml:munderover><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the mean of the reference <inline-formula><mml:math id="M109" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> over all catchments. Positive (negative) <inline-formula><mml:math id="M110" display="inline"><mml:mi>B</mml:mi></mml:math></inline-formula>s indicate overestimation (underestimation), with lower magnitudes suggesting better performance. <inline-formula><mml:math id="M111" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> measures the proportion of variance explained by the prediction; it ranges from 0 to 1, with higher values indicating better agreement.</p>
      <p id="d2e1875">The second strategy evaluates the SR-derived <inline-formula><mml:math id="M112" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> values in the context of baseflow separation using the SMM method. Specifically, the SMM baseflow time series are calculated using different <inline-formula><mml:math id="M113" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> values with the other parameter <inline-formula><mml:math id="M114" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula> fixed at 0.9 to eliminate its influence. Baseflow time series calculated with the reference <inline-formula><mml:math id="M115" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> for each catchment (<inline-formula><mml:math id="M116" display="inline"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) is used as the reference. The similarity between the calculated and reference baseflow is assessed using the Kling-Gupta Efficiency (KGE) metric  (Gupta et al., 2009):

            <disp-formula id="Ch1.E4" content-type="numbered"><label>4</label><mml:math id="M117" display="block"><mml:mrow><mml:mi mathvariant="normal">KGE</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:msqrt><mml:mrow><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:mi mathvariant="italic">ρ</mml:mi><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msub><mml:mi mathvariant="italic">σ</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi mathvariant="italic">σ</mml:mi><mml:mi>r</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>r</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:msqrt><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>

          where <inline-formula><mml:math id="M118" display="inline"><mml:mi mathvariant="italic">ρ</mml:mi></mml:math></inline-formula> is the correlation coefficient between the predicted and reference baseflow, and <inline-formula><mml:math id="M119" display="inline"><mml:mi mathvariant="italic">μ</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M120" display="inline"><mml:mi mathvariant="italic">σ</mml:mi></mml:math></inline-formula> denote the mean and standard deviation of baseflow. KGE ranges from negative infinity to 1, with higher values indicating better agreement.</p>
      <p id="d2e2018">The third strategy compares SEC calculated using the SMM baseflow with the observed SEC. Specifically, baseflow time series generated by SMM using <inline-formula><mml:math id="M121" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s derived by the constant, the power-law, and the three SR formulas are used to estimate SEC based on the chemical and water balance relationship:

            <disp-formula id="Ch1.E5" content-type="numbered"><label>5</label><mml:math id="M122" display="block"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi mathvariant="normal">SEC</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msub><mml:mi mathvariant="normal">SEC</mml:mi><mml:mrow><mml:mi mathvariant="normal">s</mml:mi><mml:mo>,</mml:mo><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>B</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mo>+</mml:mo><mml:msub><mml:mi mathvariant="normal">SEC</mml:mi><mml:mrow><mml:mi mathvariant="normal">b</mml:mi><mml:mo>,</mml:mo><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>B</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>

          where <inline-formula><mml:math id="M123" display="inline"><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M124" display="inline"><mml:mrow><mml:msub><mml:mi>B</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are the observed streamflow and the predicted baseflow at time <inline-formula><mml:math id="M125" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula>, respectively; SEC<sub>s,<italic>t</italic></sub> and SEC<sub>b,<italic>t</italic></sub> are the surface flow and baseflow SEC concentrations, respectively. The values of SEC<sub>s,<italic>t</italic></sub> and SEC<sub>b,<italic>t</italic></sub> are derived using the extreme value interpolation method, which connects the monthly maxima and minima of the observed SEC with spline interpolation to represent the stable variation of SEC in each of the flow components  (Mei et al., 2024b). The derivation of Eq. (5) is documented in Supplement Sect. S1 in the Supplement. The agreement between observed and predicted streamflow SEC is assessed using the <inline-formula><mml:math id="M130" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> metric (Eq. 1).</p>
      <p id="d2e2194">To assess whether the differences in SR-based SEC prediction performance are statistical significant, we apply the Diebold–Mariano (DM) test (Diebold and Mariano, 1995). Details on procedure and test statistics are provided in Section S2 in the Supplement. For each catchment, pairwise DM tests are performed among the three SR formulas to determine whether their SEC <inline-formula><mml:math id="M131" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> differences are statistical significance at the 0.01 significance level. If the largest <inline-formula><mml:math id="M132" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> is significantly different from the second-largest <inline-formula><mml:math id="M133" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>, the SR formula associated with the largest <inline-formula><mml:math id="M134" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> is the single best formula of the catchment. If the difference between the largest and the second-largest <inline-formula><mml:math id="M135" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>s is insignificant but that between the second and the third ones is significant, the first two SR formulas are tied. Otherwise, the three SR are tied. Based on these catchment-scale rankings, the best-performing formula for the HUC2 and HUC4 regions is determined as the one most frequently ranked as the best among all catchments within the regions.</p>
</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Results</title>
<sec id="Ch1.S4.SS1">
  <label>4.1</label><title>SR expressions for <inline-formula><mml:math id="M136" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions</title>
      <p id="d2e2276">Three SR formulas with identical functional structures and increasing complexity levels of 5, 13, and 17 were consistently identified across the ten cross-validation iterations. As summarized in Table 2, the simplest formulation is <inline-formula><mml:math id="M137" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub><mml:mo>:</mml:mo><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, followed by the intermediate formulation <inline-formula><mml:math id="M138" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>:</mml:mo><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>d</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:msub><mml:mi>c</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>e</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and the most complex formulation <inline-formula><mml:math id="M139" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:mo>:</mml:mo><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>d</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:msub><mml:mi>c</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>e</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:mo>⋅</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. The optimized coefficients of these replicated formulas vary only within narrow ranges (Table 2), indicating a high degree of consistency in parameterization across folds. From <inline-formula><mml:math id="M140" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> to <inline-formula><mml:math id="M141" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, the SR results progressively incorporate <inline-formula><mml:math id="M142" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>, <inline-formula><mml:math id="M143" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M144" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, suggesting that catchment size, subsurface permeability, and snow processes jointly govern the variability of <inline-formula><mml:math id="M145" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. The repeated identification of these three formulations across all iterations further demonstrates their structural robustness for predicting <inline-formula><mml:math id="M146" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. Accordingly, subsequent analyses focus on these three formulas.</p>

<table-wrap id="T2" specific-use="star"><label>Table 2</label><caption><p id="d2e2531">The calibrated <inline-formula><mml:math id="M147" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> and the three stable SR expressions across all ten iterations of the cross-validation. The numbers within the brackets of the first row are the complexity of the expressions.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Iteration</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M148" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">LR</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> (5)</oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M149" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (5)</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M150" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (13)</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M151" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (17)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">1</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M152" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.00</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M153" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.66</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M154" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.40</mml:mn><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">529</mml:mn></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">0.31</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.30</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.39</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M155" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.27</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">640</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.33</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.35</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.71</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.79</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">2</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M156" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.10</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M157" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.76</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M158" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.62</mml:mn><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">624</mml:mn></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">0.28</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.32</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.37</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M159" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.40</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">652</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.36</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.38</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.26</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">3</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M160" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.10</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M161" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.74</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M162" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.47</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">526</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.28</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.19</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M163" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.32</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">575</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.32</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.33</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.55</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.80</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">4</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M164" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.25</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.14</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M165" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.86</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M166" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.39</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">334</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.31</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.78</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M167" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.26</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">361</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.33</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.35</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.50</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.32</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">5</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M168" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.17</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M169" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.79</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M170" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.39</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">371</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.31</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.31</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.64</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M171" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.35</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">547</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.31</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.35</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.60</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.61</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">6</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M172" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.03</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M173" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.76</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M174" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.56</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">602</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.28</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.29</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.77</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M175" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.41</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">754</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.34</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.63</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.21</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">7</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M176" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.14</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M177" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.83</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M178" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.44</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">401</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.29</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.58</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M179" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.30</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">443</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.32</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.33</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.28</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.18</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">8</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M180" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.16</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M181" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.85</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M182" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.44</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">421</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.31</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.49</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M183" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.31</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">491</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.32</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.35</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.54</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.95</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">9</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M184" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.13</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M185" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.81</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M186" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.46</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">481</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.28</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.42</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M187" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.30</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">525</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.32</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.33</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.38</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.06</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">10</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M188" display="inline"><mml:mrow><mml:mn mathvariant="normal">3.14</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.15</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M189" display="inline"><mml:mrow><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.23</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.79</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M190" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.43</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">545</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.30</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.31</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.29</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M191" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.29</mml:mn><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">627</mml:mn><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">0.32</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi><mml:mn mathvariant="normal">0.35</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:mn mathvariant="normal">3.57</mml:mn><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.86</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e3806">Figure 3 further illustrates the behavior of these formulas. For <inline-formula><mml:math id="M192" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, the nearly identical exponents (<inline-formula><mml:math id="M193" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 0.23) and intercepts (3.66–3.86 d) result in almost overlapping curves (Fig. 3a), indicating a stable power-law relationship between <inline-formula><mml:math id="M194" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M195" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>, with a diminishing rate of increase. For <inline-formula><mml:math id="M196" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, the similarly constrained exponents (0.28–0.32) and intercepts (1.37–2.78 d) produce tightly clustered response curves (Fig. 3b–c), showing that both <inline-formula><mml:math id="M197" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M198" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> contribute positively to <inline-formula><mml:math id="M199" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. <inline-formula><mml:math id="M200" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> extends <inline-formula><mml:math id="M201" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> by introducing <inline-formula><mml:math id="M202" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> as a linear term. The replicated formulas still exhibit closely grouped slopes (3.28–3.71 d) and intercepts (1.21–2.32 d), which explains the clustering of curves in Fig. 3d–f. The marginal relationships of <inline-formula><mml:math id="M203" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> with <inline-formula><mml:math id="M204" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M205" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> in <inline-formula><mml:math id="M206" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> remain consistent with those in <inline-formula><mml:math id="M207" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, whereas increasing <inline-formula><mml:math id="M208" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> leads to an approximately linear increase in <inline-formula><mml:math id="M209" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>, at a rate of about 0.3–0.4 d per 0.1 increment in snow fraction. Overall, SR identifies <inline-formula><mml:math id="M210" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> as the most influential factor in predicting <inline-formula><mml:math id="M211" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>, as evidenced by its presence in all SR-derived formulas. The narrower ranges of predicted <inline-formula><mml:math id="M212" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s in Fig. 3b and d also suggest that <inline-formula><mml:math id="M213" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> exerts greater influence than <inline-formula><mml:math id="M214" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M215" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>.</p>

      <fig id="F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e4032">Marginal relationship of <inline-formula><mml:math id="M216" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> on different predictors (<inline-formula><mml:math id="M217" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>, <inline-formula><mml:math id="M218" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M219" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) that consist of the SR expressions (<inline-formula><mml:math id="M220" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M221" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M222" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>). Each line represents one of the ten instances of <inline-formula><mml:math id="M223" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M224" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M225" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. Panels a, b, and d are for <inline-formula><mml:math id="M226" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>; panels <bold>(c)</bold> and <bold>(e)</bold> are for <inline-formula><mml:math id="M227" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>; panel f is for <inline-formula><mml:math id="M228" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>.</p></caption>
          <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f03.png"/>

        </fig>

</sec>
<sec id="Ch1.S4.SS2">
  <label>4.2</label><title>Evaluation of <inline-formula><mml:math id="M229" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions</title>
      <p id="d2e4196">Figure 4 presents the performance of <inline-formula><mml:math id="M230" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predicted using the two literature-suggested formulas (<inline-formula><mml:math id="M231" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M232" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) and the three SR formulas (<inline-formula><mml:math id="M233" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M234" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M235" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>) for the ten training and testing sets. It should be noted that the literature-suggested formulas do not require training; instead, they are directly applied to the training and testing sets separately. Overall, the performance of formula <inline-formula><mml:math id="M236" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is poor, with negative <inline-formula><mml:math id="M237" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> values less than <inline-formula><mml:math id="M238" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>0.6. <inline-formula><mml:math id="M239" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> shows higher performance but still yields modest <inline-formula><mml:math id="M240" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> medians of 0.23 and 0.22 for the training and testing sets, respectively. The calibration with respect to SEC data improves the performance for <inline-formula><mml:math id="M241" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> to median <inline-formula><mml:math id="M242" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> values of 0.43 and 0.42 for the training and testing sets, respectively, and <inline-formula><mml:math id="M243" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> of 0.42 for the combined testing set. For predictions from the three SR-derived formulas, we observed higher performance than the conventional formulas. The <inline-formula><mml:math id="M244" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> medians for <inline-formula><mml:math id="M245" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M246" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M247" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> are 0.49, 0.53, and 0.56 for the training sets, and 0.45, 0.49, and 0.55 for the testing sets, respectively. The overall <inline-formula><mml:math id="M248" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> values for the ten testing sets together for <inline-formula><mml:math id="M249" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M250" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M251" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> are 0.48, 0.52, and 0.55, respectively. In terms of the bias, the SR-derived formulas significantly reduce the underestimation of <inline-formula><mml:math id="M252" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> by the conventional formulas (Fig. 4b). The medians <inline-formula><mml:math id="M253" display="inline"><mml:mi>B</mml:mi></mml:math></inline-formula> for <inline-formula><mml:math id="M254" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M255" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M256" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> are <inline-formula><mml:math id="M257" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.00</mml:mn><mml:mo>/</mml:mo><mml:mn mathvariant="normal">0.06</mml:mn></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M258" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.00</mml:mn><mml:mo>/</mml:mo><mml:mn mathvariant="normal">0.08</mml:mn></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M259" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.00</mml:mn><mml:mo>/</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.03</mml:mn></mml:mrow></mml:math></inline-formula> d for the training/testing sets, respectively, comparing to <inline-formula><mml:math id="M260" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M261" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> at <inline-formula><mml:math id="M262" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">4.44</mml:mn><mml:mo>/</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">4.38</mml:mn></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M263" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">2.34</mml:mn><mml:mo>/</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">2.28</mml:mn></mml:mrow></mml:math></inline-formula> d. These values for the combined testing set are <inline-formula><mml:math id="M264" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>4.44, <inline-formula><mml:math id="M265" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.33, 0.00, 0.00 and 0.00 d for <inline-formula><mml:math id="M266" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M267" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M268" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M269" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M270" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, respectively. It is noteworthy that the testing sets exhibit wider ranges of <inline-formula><mml:math id="M271" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M272" display="inline"><mml:mi>B</mml:mi></mml:math></inline-formula> values compared to the training sets. This variability is primarily attributed to the differences in catchment attributes of the testing samples rather than the discrepancies among the 10 replicated formulas. This is supported by the nearly identical coefficients (i.e., <inline-formula><mml:math id="M273" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula>, <inline-formula><mml:math id="M274" display="inline"><mml:mi>b</mml:mi></mml:math></inline-formula>, and <inline-formula><mml:math id="M275" display="inline"><mml:mi>c</mml:mi></mml:math></inline-formula>) in the SR formulas (Table 2).</p>

      <fig id="F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e4691">Performance of <inline-formula><mml:math id="M276" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions using the constant (<inline-formula><mml:math id="M277" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), power-law (<inline-formula><mml:math id="M278" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), calibrated power-law (<inline-formula><mml:math id="M279" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>), and the three SR formulas (<inline-formula><mml:math id="M280" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M281" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M282" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>) for the ten training and testing sets of the 10-fold cross-validation: coefficient of determination <inline-formula><mml:math id="M283" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> <bold>(a)</bold> and mean bias <inline-formula><mml:math id="M284" display="inline"><mml:mi>B</mml:mi></mml:math></inline-formula> <bold>(b)</bold>.</p></caption>
          <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f04.png"/>

        </fig>

</sec>
<sec id="Ch1.S4.SS3">
  <label>4.3</label><title>Application of <inline-formula><mml:math id="M285" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions in baseflow separation</title>
      <p id="d2e4816">Figure 5a reveals the baseflow separation performance of different <inline-formula><mml:math id="M286" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions measured by KGE for the testing sets. The baseflow separation performance roughly follows the ranking of <inline-formula><mml:math id="M287" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub><mml:mo>&lt;</mml:mo><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, in line with the <inline-formula><mml:math id="M288" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions (Fig. 4). The median KGEs for <inline-formula><mml:math id="M289" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M290" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M291" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M292" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M293" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M294" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> are 0.63, 0.73, 0.83, 0.84, 0.84, and 0.85, respectively. For <inline-formula><mml:math id="M295" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M296" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, 12 % and 5 % of catchments exhibit KGE <inline-formula><mml:math id="M297" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>, while 64 % and 78 % report KGE <inline-formula><mml:math id="M298" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula>, respectively. In contrast, the percentage of catchments with KGE <inline-formula><mml:math id="M299" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula> drops to 1 % for <inline-formula><mml:math id="M300" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M301" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M302" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M303" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and those with KGE <inline-formula><mml:math id="M304" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula> rise to more than 85 %. These observations indicate the benefits of performing regional calibration for the <inline-formula><mml:math id="M305" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> prediction.</p>

      <fig id="F5"><label>Figure 5</label><caption><p id="d2e5069">Baseflow separation performance based on different <inline-formula><mml:math id="M306" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions for all catchments <bold>(a)</bold> and for catchments of the 18 HUC2 regions <bold>(b)</bold>, and relative performance between each pair of the three SR cases for the HUC2 regions <bold>(c)</bold>. Regions with fewer than 10 catchments are plotted by dashed lines in panels <bold>(b)</bold> and <bold>(c)</bold>.</p></caption>
          <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f05.png"/>

        </fig>

      <p id="d2e5101">Figure 5b shows the performance of the three SR formulas across the 18 HUC2 regions. Overall, all formulas perform well for the HUC2 regions, with median KGEs ranging from 0.57 to 0.93. The best performing regions for <inline-formula><mml:math id="M307" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M308" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M309" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> are HUC 02, 01, and 07, respectively, exhibiting median KGE values above 0.89 and over 95 % of catchments achieving KGE values greater than 0.5. In contrast, the lowest performance for all three formulas occurs in HUC 12, where median KGE values fall below 0.65 and more than 25 % of catchments show KGE values below 0.5. This may be related to the relative arid climate and flashy hydrological response of HUC 12 (Kratzert et al., 2019; Feng et al., 2020), which is difficult for SMM to capture. Note that SMM is more skillful for smooth baseflow dynamics  (Stewart, 2015). All three formulas exhibit larger performance variability in HUC 10–12 and 14 compared to other regions. This can be attributed to the fact that these regions are mountainous and plain areas, characterized by relatively high heterogeneity in catchment characteristics.</p>
      <p id="d2e5138">Figure 5c compares the relative performance of <inline-formula><mml:math id="M310" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M311" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M312" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> across regions. <inline-formula><mml:math id="M313" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> outperforms <inline-formula><mml:math id="M314" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> for HUC 04-09 located in the northern and northeastern CONUS, while it performs worse than <inline-formula><mml:math id="M315" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in HUC 12–15 on the south. <inline-formula><mml:math id="M316" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> generally outperforms <inline-formula><mml:math id="M317" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in the mountainous region spanning HUC 10–11 and 13–18, and shows comparable performance to <inline-formula><mml:math id="M318" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in HUC 01, 02, 04, 05, and 07 with mild topography. In HUC 02, 04, 07, 08, 10, 11, 13, 14, 16, and 18, the most complex <inline-formula><mml:math id="M319" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> outperforms the other SR formulas. However, <inline-formula><mml:math id="M320" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> performs worse than <inline-formula><mml:math id="M321" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M322" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in HUC 12. This may be because the SR formulas were calibrated using all catchments to optimize performance at the CONUS scale; thus, their region-specific performance inevitably reflects trade-offs. In relatively warm regions such as HUC 12, where snow influence is weak, the SWE term included in <inline-formula><mml:math id="M323" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> may add unnecessary complexity rather than useful information, resulting in slightly poorer performance than <inline-formula><mml:math id="M324" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M325" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>.</p>
      <p id="d2e5319">Figure 6 presents the average KGE of baseflow separation as functions of the three influential catchment attributes. Overall, the SR formulas consistently outperform the literature-suggested formulas for most of the predictor value ranges, with relatively minor performance differences among <inline-formula><mml:math id="M326" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M327" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M328" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, highlighting their robustness across diverse catchment conditions. According to Fig. 6a, when <inline-formula><mml:math id="M329" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> exceeds 300 km<sup>2</sup>, corresponding to <inline-formula><mml:math id="M331" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> d by <inline-formula><mml:math id="M332" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, the performance of <inline-formula><mml:math id="M333" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> deteriorates markedly. This suggests that using <inline-formula><mml:math id="M334" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> d cannot adequately represent its variation for larger <inline-formula><mml:math id="M335" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>s. Conversely, for <inline-formula><mml:math id="M336" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">300</mml:mn></mml:mrow></mml:math></inline-formula> km<sup>2</sup>, the performance of <inline-formula><mml:math id="M338" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> declines, indicating that the power function coefficients are not suitable for smaller catchments over CONUS. The calibrated power-function (<inline-formula><mml:math id="M339" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) reveals improved performance to a similar level with the SR formulas except for the <inline-formula><mml:math id="M340" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula> km<sup>2</sup> bin, indicating the necessity regional calibration. Across the full range of <inline-formula><mml:math id="M342" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>, the SR formulas consistently achieve higher KGE values, emphasizing the benefits of regional calibration. For small catchment (<inline-formula><mml:math id="M343" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula> km<sup>2</sup>), accounting for <inline-formula><mml:math id="M345" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M346" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> leads to performance gains. In contrast, for larger basins (<inline-formula><mml:math id="M347" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&gt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula> km<sup>2</sup>), the additional contribution of these factors becomes negligible.</p>

      <fig id="F6" specific-use="star"><label>Figure 6</label><caption><p id="d2e5574">Performance of baseflow separation for different ranges of catchment area <bold>(a)</bold>, catchment-averaged saturated hydraulic conductivity <bold>(b)</bold>, and snow day fraction <bold>(c)</bold>. The right <inline-formula><mml:math id="M349" display="inline"><mml:mi>y</mml:mi></mml:math></inline-formula>-axis for panel <bold>(b)</bold> is in logarithmic scale.</p></caption>
          <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f06.png"/>

        </fig>

      <p id="d2e5602">Figure 6b examines the influence of <inline-formula><mml:math id="M350" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. When <inline-formula><mml:math id="M351" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> mm h<sup>−1</sup>, all predictions show similar level of baseflow prediction performance, suggesting that <inline-formula><mml:math id="M353" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is not a major factor for catchments with low soil hydraulic conductivity. In the intermediate ranges (5–25 mm h<sup>−1</sup>), the two regionally fitted power-law formulas (<inline-formula><mml:math id="M355" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M356" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) outperform the conventional power-law formula (<inline-formula><mml:math id="M357" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>). Although <inline-formula><mml:math id="M358" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M359" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> do not explicitly include <inline-formula><mml:math id="M360" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, their performance remains comparable to <inline-formula><mml:math id="M361" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M362" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, which incorporate <inline-formula><mml:math id="M363" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. This indicates that regional fitting may compensate the effects of <inline-formula><mml:math id="M364" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> for small and medium values. When <inline-formula><mml:math id="M365" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&gt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">25</mml:mn></mml:mrow></mml:math></inline-formula> mm h<sup>−1</sup>, incorporating <inline-formula><mml:math id="M367" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> substantially improves the predictions, highlighting the increasing importance of subsurface processes in highly permeable catchments. Figure 6c reveals the influence of <inline-formula><mml:math id="M368" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. <inline-formula><mml:math id="M369" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> outperforms all formulas when <inline-formula><mml:math id="M370" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&gt;</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">0.4</mml:mn></mml:mrow></mml:math></inline-formula>, indicating the importance of <inline-formula><mml:math id="M371" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> for catchments with stronger snow persistency. In contrast, for <inline-formula><mml:math id="M372" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&lt;</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">0.4</mml:mn></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M373" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M374" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M375" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> perform similarly to <inline-formula><mml:math id="M376" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, demonstrating that regionally calibrated coefficients can partially offset the lack of explicit consideration of snow-related variables.</p>
</sec>
<sec id="Ch1.S4.SS4">
  <label>4.4</label><title>Estimation of SEC variation based on predicted <inline-formula><mml:math id="M377" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula></title>
      <p id="d2e5954">The SEC estimation performance by different <inline-formula><mml:math id="M378" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions for the testing set is evaluated using <inline-formula><mml:math id="M379" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>. The median <inline-formula><mml:math id="M380" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> values range from 0.70 to 0.74 for the <inline-formula><mml:math id="M381" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M382" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M383" display="inline"><mml:mrow><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M384" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M385" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M386" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> formulas, with similar interquartile ranges between 0.29 and 0.33, indicating relatively small overall differences among formulas. Despite these modest differences, both the medians and interquartile ranges of <inline-formula><mml:math id="M387" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> follow a clear order of <inline-formula><mml:math id="M388" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msub><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi></mml:msub><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&lt;</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msubsup><mml:mi>F</mml:mi><mml:mi mathvariant="normal">PL</mml:mi><mml:mo>′</mml:mo></mml:msubsup><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. This ranking is consistent with both the <inline-formula><mml:math id="M389" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions (Fig. 4) and the baseflow separation results (Fig. 5). The mean <inline-formula><mml:math id="M390" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> differences between most formulas are statistically significant, except for the comparison between <inline-formula><mml:math id="M391" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M392" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M393" display="inline"><mml:mrow><mml:mi>p</mml:mi><mml:mo>≥</mml:mo><mml:mn mathvariant="normal">0.01</mml:mn></mml:mrow></mml:math></inline-formula>).</p>
      <p id="d2e6174">Figure 7 illustrates the spatial distribution of the best-performing formulas across the HUC4 regions. <inline-formula><mml:math id="M394" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> demonstrates superior performance across most of the mountainous regions, including the Rocky Mountain foothills, Cascade Range, Sierra Nevada, and some regions within the Great Plains. The improvement for the mountainous regions is likely due to the explicit incorporation of <inline-formula><mml:math id="M395" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> in the SR formula, capturing the influence of snow processes; for the relatively flat Great Plains regions, the improvement is primarily driven by the consideration of <inline-formula><mml:math id="M396" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, which better represents subsurface processes such as infiltration capacity, percolation, and lateral subsurface flow that regulate groundwater recharge and baseflow contributions. In contrast, <inline-formula><mml:math id="M397" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> performs best in the eastern and southeastern CONUS, including the Appalachian Mountains, coastal plain, and Florida peninsular, where the effects of <inline-formula><mml:math id="M398" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M399" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are minimal. These regions are generally characterized by low BFI values (Fig. 1c), indicating surface runoff-dominated streamflow with limited relevance of delayed-flow processes (Wu et al., 2021; Mcmillan, 2020). <inline-formula><mml:math id="M400" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> achieves the highest performance in fewer HUC4 regions, indicating that the effects of <inline-formula><mml:math id="M401" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> may be compensated by the regional calibration of <inline-formula><mml:math id="M402" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. Interestingly, several regions located in the Great Plains exhibit mixed optimal performance for multiple formulas, suggesting a more complex interplay of hydrological drivers in these areas.</p>

      <fig id="F7"><label>Figure 7</label><caption><p id="d2e6279">Spatial distribution of the best-performing formulas for SEC estimations across different HUC4 regions. At the HUC4 scale, the best-performing formula is the one(s) appears most frequently as the best among all catchments within the region.</p></caption>
          <graphic xlink:href="https://hess.copernicus.org/articles/30/3425/2026/hess-30-3425-2026-f07.png"/>

        </fig>

</sec>
</sec>
<sec id="Ch1.S5">
  <label>5</label><title>Discussions</title>
<sec id="Ch1.S5.SS1">
  <label>5.1</label><title>Regionalization of baseflow separation parameter by SR</title>
      <p id="d2e6305">In this study, we used SR to derive mathematical expressions for the predictions of <inline-formula><mml:math id="M403" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> using 9 catchment attributes. Across ten cross-validation iterations, the identified expressions exhibited consistent structures, predictors, and nearly identical regression coefficients, indicating that SR can yield stable functional relationships between catchment attributes and <inline-formula><mml:math id="M404" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. Compared to the RF-based predictions reported by  Lin et al. (2026), the SR-based approach showed lower predictive skill (<inline-formula><mml:math id="M405" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo></mml:mrow></mml:math></inline-formula> 0.54 vs. 0.80), reflecting the trade-off between predictive accuracy and interpretability. While RF achieves superior predictive performance, it functions as a “black-box” ensemble, offering no explicit functional form to clarify whether environmental controls operate additively, multiplicatively, or through nonlinear transformations. In contrast, SR provides structural transparency by yielding a closed-form equation, facilitating direct analytical insights  (Karpatne et al., 2024; Häfner et al., 2023). This explicit representation enables rigorous sensitivity analysis via differentiation; for instance, the marginal effects derived from equation <inline-formula><mml:math id="M406" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> quantify how geomorphic and climatic factors jointly govern <inline-formula><mml:math id="M407" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>. By trading a degree of predictive skill for parsimony, SR transforms the problem from simple estimation into a hypothesis-generating exercise, providing compact transfer functions that are easily integrated into regionalization frameworks (Feigl et al., 2022; Samaniego et al., 2010). Therefore, RF and SR should be viewed as complementary rather than competing approaches: RF provides a benchmark for predictive performance, while SR offers structural transparency that facilitates theoretical interpretation and model integration.</p>
      <p id="d2e6353">One important aspect to consider when training SR models is the diversity of mathematical operators. A wide variety of operators for model training enables the discovery of complex relationships among variables, but it also enlarges the search space, increasing training time and risk of overfitting (Li et al., 2025; Elsken et al., 2019). To address these challenges, we adopted two strategies. First, we incorporated domain knowledge to guide the choice of operators. Specifically, the well-established power-law relationship between streamflow response time and catchment area motivated the inclusion of the power-law operator in the SR operator set. The fact that all SR-derived formulas captured this power-law relationship indicates the effectiveness of using this domain knowledge. Second, cross-validation was applied to assess model generalizability and reduce overfitting, ensuring representativeness of the SR expressions across the catchments. Although SR can generate more complex formulas than <inline-formula><mml:math id="M408" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> with better training fit, these structures are inconsistent across folds. This suggests that they may overfit specific subsets of the data and lack generalizability, and are therefore excluded from our analysis.</p>
</sec>
<sec id="Ch1.S5.SS2">
  <label>5.2</label><title>Influential catchment attributes for <inline-formula><mml:math id="M409" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> predictions</title>
      <p id="d2e6384">The segment length parameter <inline-formula><mml:math id="M410" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> is a proxy of the average duration of surface flow, and larger values indicate surface flow of event sustain for longer time on average (Stoelzle et al., 2020). Our findings indicate that <inline-formula><mml:math id="M411" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> is a power function of catchment area with exponent of 0.22–0.23 (<inline-formula><mml:math id="M412" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, Table 2), indicating that larger catchments are characterized by longer average surface flow duration (Garzon et al., 2023; Mei and Anagnostou, 2015), and the increasing rate in duration slows down for larger <inline-formula><mml:math id="M413" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>s. This could be attributed to the longer averaged water paths for larger catchments (i.e., the Hack's Law), increasing the average traveling time for surface flow of event  (Tarasova et al., 2024). Saturated hydraulic conductivity is another key factor in the predictions of <inline-formula><mml:math id="M414" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>: <inline-formula><mml:math id="M415" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> increases according to the power-law functions with exponents of 0.28–0.36 with respect to <inline-formula><mml:math id="M416" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M417" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M418" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in Table 2). This indicates that higher <inline-formula><mml:math id="M419" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>values tend to increase the average duration of surface flow with decreasing rate. A possible explanation is that catchments with higher <inline-formula><mml:math id="M420" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> tend to promote infiltration, making more rainfall excess to route through the slow subsurface flow paths than the rapid overland ones (Nagy et al., 2024). <inline-formula><mml:math id="M421" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> reveals that prolonged snow cover (higher fraction of days covered by snow) is linearly associated with longer surface flow duration. This is due to the snowpack acting as a seasonal storage that modulates streamflow timing (Stoelzle et al., 2020). The gradual melting of snowpack slowly released meltwater to the stream networks, increasing the time needed to leave the catchment (Noor et al., 2023; Barnhart et al., 2016; Godsey et al., 2014). Overall, the additive structure among <inline-formula><mml:math id="M422" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>, <inline-formula><mml:math id="M423" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M424" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> reflect the separate contributions of different catchment-scale delay processes to the event flow through different pathways and at different time scales. Their additive combination therefore provides a parsimonious empirical approximation of the integrated flow-duration response.</p>
</sec>
<sec id="Ch1.S5.SS3">
  <label>5.3</label><title>Trade-off between formula complexity and prediction accuracy</title>
      <p id="d2e6538">Our experiments reveal that formulas for baseflow separation with higher structural complexity generally achieve better predictive performance. This is because more complex formulas can incorporate additional predictors for more detailed descriptions of the underlying hydrological processes. However, the predictive gain from increased complexity is not uniform across all hydro-climatic conditions. For example, when <inline-formula><mml:math id="M425" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M426" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> take relatively small values (<inline-formula><mml:math id="M427" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&lt;</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">25</mml:mn></mml:mrow></mml:math></inline-formula> mm h<sup>−1</sup> and <inline-formula><mml:math id="M429" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&lt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">0.4</mml:mn></mml:mrow></mml:math></inline-formula>), the performance differences among <inline-formula><mml:math id="M430" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M431" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M432" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> are minimal (Fig. 6). This is likely because small variations in <inline-formula><mml:math id="M433" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M434" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> have limited impact to the prediction, allowing the regional calibration to partially compensate for the absence of these variables in the formulas. However, such compensation is limited for large <inline-formula><mml:math id="M435" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M436" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M437" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mo>&gt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">25</mml:mn></mml:mrow></mml:math></inline-formula> mm h<sup>−1</sup> and <inline-formula><mml:math id="M439" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&gt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">0.4</mml:mn></mml:mrow></mml:math></inline-formula>), where their influence becomes more pronounced (Jenicek and Ledvinka, 2020; Beven and Germann, 2013). Moreover, the effects of <inline-formula><mml:math id="M440" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M441" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are more evident when <inline-formula><mml:math id="M442" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula> is smaller than 100 km<sup>2</sup> (Fig. 6a). As catchment area increases (<inline-formula><mml:math id="M444" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>&gt;</mml:mo><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula> km<sup>2</sup>), their influence is outweighed by <inline-formula><mml:math id="M446" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>, highlighting the dominant role of drainage area in shaping the streamflow response time (McGlynn et al., 2004; Sólyom and Tucker, 2007).</p>
</sec>
</sec>
<sec id="Ch1.S6" sec-type="conclusions">
  <label>6</label><title>Conclusions and future work</title>
      <p id="d2e6812">In this study, we applied symbolic regression to derive formulas for the prediction of segment length parameter <inline-formula><mml:math id="M447" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> (a proxy of the average duration of surface flow) of the smooth minima baseflow separation method across 855 CONUS catchments. Three stable formulas with increasing complexity were identified: <inline-formula><mml:math id="M448" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:msup><mml:mi>A</mml:mi><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M449" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>d</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:msub><mml:mi>c</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>e</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M450" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>d</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:mo>(</mml:mo><mml:mi>A</mml:mi><mml:mo>+</mml:mo><mml:msub><mml:mi>c</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mrow><mml:msub><mml:mi>e</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:mo>⋅</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, where catchment area (<inline-formula><mml:math id="M451" display="inline"><mml:mi>A</mml:mi></mml:math></inline-formula>), saturated hydraulic conductivity (<inline-formula><mml:math id="M452" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), and snow day fraction (<inline-formula><mml:math id="M453" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) are identified as important predictors. These SR formulas showed substantial improvements in predictive accuracy of <inline-formula><mml:math id="M454" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> comparing to the constant (<inline-formula><mml:math id="M455" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula>) and power-law formula (<inline-formula><mml:math id="M456" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.6</mml:mn><mml:msup><mml:mi>A</mml:mi><mml:mn mathvariant="normal">0.2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>). The SR-derived <inline-formula><mml:math id="M457" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>s also reveal better performance in baseflow separation and in estimation of electrical conductance dynamics. Among the three SR formulas, <inline-formula><mml:math id="M458" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> performs better in regions influenced by snow, such as the mountainous mid-west and the northern CONUS; <inline-formula><mml:math id="M459" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>  shows better performance in the eastern and southeastern CONUS, where both the climate and terrain are mild and infiltration rate is low. Overall, formulas that consider <inline-formula><mml:math id="M460" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M461" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> tend to yield higher predictive accuracy, but simpler formulas without <inline-formula><mml:math id="M462" display="inline"><mml:mrow><mml:msub><mml:mi>K</mml:mi><mml:mi mathvariant="normal">sat</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> or <inline-formula><mml:math id="M463" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi mathvariant="normal">SWE</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> can still achieve comparable performance when the values of these key predictors are relatively small. This study presents a new paradigm for regionalization of optimal baseflow parameters using symbolic regression and demonstrates its potential to improve model interpretability and transferability across diverse catchments.</p>
      <p id="d2e7124">This study used all gages across CONUS to train SR. However, the influence of catchment attributes on <inline-formula><mml:math id="M464" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> varies across regions. Future work could explore the benefits of developing region-specific SR formulas for different catchment clusters to improve the prediction performance. Furthermore, this study investigated SR-based modeling of only one parameter of a baseflow separation method. Future research could explore applying SR to other baseflow separation methods to identify the governing equations relating catchment attributes to the parameters of these methods. This may help to understand how catchment attributes influence the partitioning of streamflow.</p>
</sec>

      
      </body>
    <back><notes notes-type="codedataavailability"><title>Code and data availability</title>

      <p id="d2e7138">The streamflow and baseflow time series and optimal baseflow filters parameters are available on Mei et al. (2024a, <ext-link xlink:href="https://doi.org/10.5281/zenodo.8388365" ext-link-type="DOI">10.5281/zenodo.8388365</ext-link>). The HUC region maps are downloaded from Climate Mapping for Resilience &amp; Adaptation (CMRA). The catchment attributes of the 855 catchments are available on Lin et al. (2025, <ext-link xlink:href="https://doi.org/10.5281/zenodo.16924118" ext-link-type="DOI">10.5281/zenodo.16924118</ext-link>).</p>
  </notes><app-group>
        <supplementary-material position="anchor"><p id="d2e7147">The supplement related to this article is available online at <inline-supplementary-material xlink:href="https://doi.org/10.5194/hess-30-3425-2026-supplement" xlink:title="pdf">https://doi.org/10.5194/hess-30-3425-2026-supplement</inline-supplementary-material>.</p></supplementary-material>
        </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e7156">Yongen Lin: Conceptualization, Methodology, Data curation, Formal analysis, Visualization, investigation, validation, writing – original draft; Dagang Wang: Conceptualization, Methodology, Writing – review &amp; editing, supervision, Resources, funding acquisition, project administration; Yiwen Mei: Conceptualization, Methodology, Writing – review &amp; editing, supervision, Resources, funding acquisition; Jinxin Zhu: Methodology, Writing – review &amp; editing; Huan Wu: Writing – review &amp; editing; Shuo Wang: Writing – review &amp; editing; Zhonghou Xu: Resources, Writing – review &amp; editing; Asaad Y. Shamseldin: Resources, Writing – review &amp; editing; Emmanouil N. Anagnostou: Writing – review &amp; editing.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e7162">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e7168">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. The authors bear the ultimate responsibility for providing appropriate place names. Views expressed in the text are those of the authors and do not necessarily reflect the views of the publisher.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e7174">This paper is dedicated to the memory of Professor Asaad Y. Shamseldin, whose guidance were invaluable to this work. He passed away in February 2026 and is deeply missed.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e7179">This work is supported by the National Natural Science Foundation of China (grant no. 52579030) and the Guangdong Natural Science Foundation (grant nos. 2025A1515011666 and 2025A1515012264).</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e7186">This paper was edited by Rohini Kumar and reviewed by four anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bib1"><label>1</label><mixed-citation>Aksoy, H., Unal, N. E., and Pektas, A. O.: Smoothed minima baseflow separation tool for perennial and intermittent streams, Hydrol. Process., 22, 4467–4476, <ext-link xlink:href="https://doi.org/10.1002/hyp.7077" ext-link-type="DOI">10.1002/hyp.7077</ext-link>, 2008.</mixed-citation></ref>
      <ref id="bib1.bib2"><label>2</label><mixed-citation> Apley, D. W. and Zhu, J.: Visualizing the Effects of Predictor Variables in Black Box Supervised Learning Models, J. Roy. Stat. Soc. B, 82, 1059–1086, 10.1111/rssb.12377, 2020.</mixed-citation></ref>
      <ref id="bib1.bib3"><label>3</label><mixed-citation>Barnhart, T. B., Molotch, N. P., Livneh, B., Harpold, A. A., Knowles, J. F., and Schneider, D.: Snowmelt rate dictates streamflow, Geophys. Res. Lett., 43, 8006–8016, <ext-link xlink:href="https://doi.org/10.1002/2016GL069690" ext-link-type="DOI">10.1002/2016GL069690</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib4"><label>4</label><mixed-citation>Beven, K. and Germann, P.: Macropores and water flow in soils revisited, Water Resour. Res., 49, 3071–3092, <ext-link xlink:href="https://doi.org/10.1002/wrcr.20156" ext-link-type="DOI">10.1002/wrcr.20156</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib5"><label>5</label><mixed-citation>Cartwright, I.: Implications of variations in stream specific conductivity for estimating baseflow using chemical mass balance and calibrated hydrograph techniques, Hydrol. Earth Syst. Sci., 26, 183–195, <ext-link xlink:href="https://doi.org/10.5194/hess-26-183-2022" ext-link-type="DOI">10.5194/hess-26-183-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib6"><label>6</label><mixed-citation>Chadalawada, J., Herath, H. M. V. V., and Babovic, V.: Hydrologically Informed Machine Learning for Rainfall-Runoff Modeling: A Genetic Programming-Based Toolkit for Automatic Model Induction, Water Resour. Res., 56, e2019WR026933, <ext-link xlink:href="https://doi.org/10.1029/2019WR026933" ext-link-type="DOI">10.1029/2019WR026933</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib7"><label>7</label><mixed-citation>Cranmer, M.: Interpretable machine learning for science with PySR and SymbolicRegression.jl, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2305.01582" ext-link-type="DOI">10.48550/arXiv.2305.01582</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib8"><label>8</label><mixed-citation> Diebold, F. X. and Mariano, R. S.: Comparing Predictive Accuracy, J. Bus. Econ. Stat., 13, 253–263, 10.1080/07350015.1995.10524599, 1995.</mixed-citation></ref>
      <ref id="bib1.bib9"><label>9</label><mixed-citation> Elsken, T., Metzen, J. H., and Hutter, F.: Neural architecture search: a survey, J. Mach. Learn. Res., 20, 1997–2017, 2019.</mixed-citation></ref>
      <ref id="bib1.bib10"><label>10</label><mixed-citation> Feigl, M., Herrnegger, M., Klotz, D., and Schulz, K.: Function Space Optimization: A Symbolic Regression Method for Estimating Parameter Transfer Functions for Hydrological Models, Water Resour. Res., 56, e2020WR027385, 10.1029/2020WR027385, 2020.</mixed-citation></ref>
      <ref id="bib1.bib11"><label>11</label><mixed-citation>Feigl, M., Thober, S., Schweppe, R., Herrnegger, M., Samaniego, L., and Schulz, K.: Automatic Regionalization of Model Parameters for Hydrological Models, Water Resour. Res., 58, e2022WR031966, <ext-link xlink:href="https://doi.org/10.1029/2022WR031966" ext-link-type="DOI">10.1029/2022WR031966</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib12"><label>12</label><mixed-citation>Feng, D., Fang, K., and Shen, C.: Enhancing Streamflow Forecast and Extracting Insights Using Long-Short Term Memory Networks With Data Integration at Continental Scales, Water Resour. Res., 56, e2019WR026793, <ext-link xlink:href="https://doi.org/10.1029/2019wr026793" ext-link-type="DOI">10.1029/2019wr026793</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib13"><label>13</label><mixed-citation>Garzon, L. F. L., Johnson, M. F., Mount, N., and Gomez, H.: Exploring the effects of catchment morphometry on overland flow response to extreme rainfall using a 2D hydraulic-hydrological model (IBER), J. Hydrol., 627, 130405, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2023.130405" ext-link-type="DOI">10.1016/j.jhydrol.2023.130405</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib14"><label>14</label><mixed-citation>Gnann, S. J., McMillan, H. K., Woods, R. A., and Howden, N. J. K.: Including Regional Knowledge Improves Baseflow Signature Predictions in Large Sample Hydrology, Water Resour. Res., 57, e2020WR028354, <ext-link xlink:href="https://doi.org/10.1029/2020WR028354" ext-link-type="DOI">10.1029/2020WR028354</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib15"><label>15</label><mixed-citation>Godsey, S. E., Kirchner, J. W., and Tague, C. L.: Effects of changes in winter snowpacks on summer low flows: case studies in the Sierra Nevada, California, USA, Hydrol. Process., 28, 5048–5064, <ext-link xlink:href="https://doi.org/10.1002/hyp.9943" ext-link-type="DOI">10.1002/hyp.9943</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib16"><label>16</label><mixed-citation> Gupta, H. V., Kling, H., Yilmaz, K. K., and Martinez, G. F.: Decomposition of the mean squared error and NSE performance criteria: Implications for improving hydrological modelling, J. Hydrol., 377, 80–91, 10.1016/j.jhydrol.2009.08.003, 2009.</mixed-citation></ref>
      <ref id="bib1.bib17"><label>17</label><mixed-citation> Gustard, A., Bullock, A. D., and Dixon, J. M.: Low Flow Estimation in the United Kingdom, Institute of Hydrology, Wallingford, UK, ISBN 0948540451, 1992.</mixed-citation></ref>
      <ref id="bib1.bib18"><label>18</label><mixed-citation>Häfner, D., Gemmrich, J., and Jochum, M.: Machine-guided discovery of a real-world rogue wave model, P. Natl. Acad. Sci. USA, 120, e2306275120, <ext-link xlink:href="https://doi.org/10.1073/pnas.2306275120" ext-link-type="DOI">10.1073/pnas.2306275120</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib19"><label>19</label><mixed-citation>Hagedorn, B.: Hydrograph separation through multi objective optimization: Revealing the importance of a temporally and spatially constrained baseflow solute source, J. Hydrol., 590, 125349, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2020.125349" ext-link-type="DOI">10.1016/j.jhydrol.2020.125349</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib20"><label>20</label><mixed-citation>Hou, X., Xie, D., Feng, L., Shen, F., and Nienhuis, J. H.: Sustained increase in suspended sediments near global river deltas over the past two decades, Nat. Commun., 15, 3319, <ext-link xlink:href="https://doi.org/10.1038/s41467-024-47598-6" ext-link-type="DOI">10.1038/s41467-024-47598-6</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib21"><label>21</label><mixed-citation>Humphrey, C. E., Solomon, D. K., Genereux, D. P., Gilmore, T. E., Mittelstet, A. R., Zlotnik, V. A., Zeyrek, C., Jensen, C. R., and MacNamara, M. R.: Using Automated Seepage Meters to Quantify the Spatial Variability and Net Flux of Groundwater to a Stream, Water Resour. Res., 58, e2021WR030711, <ext-link xlink:href="https://doi.org/10.1029/2021WR030711" ext-link-type="DOI">10.1029/2021WR030711</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib22"><label>22</label><mixed-citation>Jenicek, M. and Ledvinka, O.: Importance of snowmelt contribution to seasonal runoff and summer low flows in Czechia, Hydrol. Earth Syst. Sci., 24, 3475–3491, <ext-link xlink:href="https://doi.org/10.5194/hess-24-3475-2020" ext-link-type="DOI">10.5194/hess-24-3475-2020</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib23"><label>23</label><mixed-citation>Karpatne, A., Jia, X., and Kumar, V.: Knowledge-guided machine learning: Current trends and future prospects, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2403.15989" ext-link-type="DOI">10.48550/arXiv.2403.15989</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib24"><label>24</label><mixed-citation>Klotz, D., Herrnegger, M., and Schulz, K.: Symbolic Regression for the Estimation of Transfer Functions of Hydrological Models, Water Resour. Res., 53, 9402–9423, <ext-link xlink:href="https://doi.org/10.1002/2017wr021253" ext-link-type="DOI">10.1002/2017wr021253</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib25"><label>25</label><mixed-citation>Koza, J. R.: Genetic programming as a means for programming computers by natural selection, Stat. Comput., 4, 87–112, <ext-link xlink:href="https://doi.org/10.1007/BF00175355" ext-link-type="DOI">10.1007/BF00175355</ext-link>, 1994.</mixed-citation></ref>
      <ref id="bib1.bib26"><label>26</label><mixed-citation>Kratzert, F., Klotz, D., Shalev, G., Klambauer, G., Hochreiter, S., and Nearing, G.: Towards learning universal, regional, and local hydrological behaviors via machine learning applied to large-sample datasets, Hydrol. Earth Syst. Sci., 23, 5089–5110, <ext-link xlink:href="https://doi.org/10.5194/hess-23-5089-2019" ext-link-type="DOI">10.5194/hess-23-5089-2019</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib27"><label>27</label><mixed-citation>Kronberger, G., de Franca, F. O., Burlacu, B., Haider, C., and Kommenda, M.: Shape-Constrained Symbolic Regression – Improving Extrapolation with Prior Knowledge, Evol. Comput., 30, 75–98, <ext-link xlink:href="https://doi.org/10.1162/evco_a_00294" ext-link-type="DOI">10.1162/evco_a_00294</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib28"><label>28</label><mixed-citation>Li, Q., Zhang, C., Wei, Z., Jin, X., Shangguan, W., Yuan, H., Zhu, J., Li, L., Liu, P., Chen, X., Yan, Y., and Dai, Y.: Advancing symbolic regression for earth science with a focus on evapotranspiration modeling, npj Climate and Atmospheric Science, 7, <ext-link xlink:href="https://doi.org/10.1038/s41612-024-00861-5" ext-link-type="DOI">10.1038/s41612-024-00861-5</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib29"><label>29</label><mixed-citation>Li, X., Zhang, J., Li, D., Liu, X., Xu, J., and Yin, J.: UniSymNet: A Unified Symbolic Network Guided by Transformer, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2505.06091" ext-link-type="DOI">10.48550/arXiv.2505.06091</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib30"><label>30</label><mixed-citation>Lin, Y., Mei, Y., and Wang, D.: Data and code archive for “Regionalization of Optimal Baseflow Separation using Catchment-scale Characteristics”, Zenodo [data set/code], <ext-link xlink:href="https://doi.org/10.5281/zenodo.16924118" ext-link-type="DOI">10.5281/zenodo.16924118</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib31"><label>31</label><mixed-citation>Lin, Y., Mei, Y., Wang, D., Zhu, J., Wu, H., Wang, S., Yin, G., Gao, L., and N. Anagnostou, E.: Regionalization of Optimal Baseflow Separation using Catchment-scale Characteristics, Water Resour. Res., 62, <ext-link xlink:href="https://doi.org/10.1029/2025WR040578" ext-link-type="DOI">10.1029/2025WR040578</ext-link>, 2026.</mixed-citation></ref>
      <ref id="bib1.bib32"><label>32</label><mixed-citation>Makke, N. and Chawla, S.: Interpretable scientific discovery with symbolic regression: a review, Artif. Intell. Rev., 57, <ext-link xlink:href="https://doi.org/10.1007/s10462-023-10622-0" ext-link-type="DOI">10.1007/s10462-023-10622-0</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib33"><label>33</label><mixed-citation>McGlynn, B. L., McDonnell, J. J., Seibert, J., and Kendall, C.: Scale effects on headwater catchment runoff timing, flow sources, and groundwater-streamflow relations, Water Resour. Res., 40, <ext-link xlink:href="https://doi.org/10.1029/2003WR002494" ext-link-type="DOI">10.1029/2003WR002494</ext-link>, 2004.</mixed-citation></ref>
      <ref id="bib1.bib34"><label>34</label><mixed-citation>McMahon, T. A. and Nathan, R. J.: Baseflow and transmission loss: A review, WIREs Water, 8, e1527, <ext-link xlink:href="https://doi.org/10.1002/wat2.1527" ext-link-type="DOI">10.1002/wat2.1527</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib35"><label>35</label><mixed-citation>McMillan, H.: Linking hydrologic signatures to hydrologic processes: A review, Hydrol. Process., 34, 1393–1409, <ext-link xlink:href="https://doi.org/10.1002/hyp.13632" ext-link-type="DOI">10.1002/hyp.13632</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib36"><label>36</label><mixed-citation>McMillan, H. K., Gnann, S. J., and Araki, R.: Large Scale Evaluation of Relationships Between Hydrologic Signatures and Processes, Water Resour. Res., 58, e2021WR031751, <ext-link xlink:href="https://doi.org/10.1029/2021WR031751" ext-link-type="DOI">10.1029/2021WR031751</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib37"><label>37</label><mixed-citation>Mei, Y. and Anagnostou, E. N.: A hydrograph separation method based on information from rainfall and runoff records, J. Hydrol., 523, 636–649, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2015.01.083" ext-link-type="DOI">10.1016/j.jhydrol.2015.01.083</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib38"><label>38</label><mixed-citation>Mei, Y., Zhu, J., and Wang, D.: Data and Code Archive for “Optimal Baseflow Separation through Chemical Mass Balance: Comparing the Usages of Two Tracers, Two Concentration Estimation Methods, and Four Baseflow Filters”, Zenodo [data set/code], <ext-link xlink:href="https://doi.org/10.5281/zenodo.8388365" ext-link-type="DOI">10.5281/zenodo.8388365</ext-link>, 2024a.</mixed-citation></ref>
      <ref id="bib1.bib39"><label>39</label><mixed-citation>Mei, Y., Wang, D., Zhu, J., Tang, G., Cai, C., Shen, X., Hong, Y., and Zhang, X.: Optimal Baseflow Separation Through Chemical Mass Balance: Comparing the Usages of Two Tracers, Two Concentration Estimation Methods, and Four Baseflow Filters, Water Resour. Res., 60, <ext-link xlink:href="https://doi.org/10.1029/2023wr036386" ext-link-type="DOI">10.1029/2023wr036386</ext-link>, 2024b.</mixed-citation></ref>
      <ref id="bib1.bib40"><label>40</label><mixed-citation>Nagy, E. D., Szilagyi, J., and Torma, P.: Calibrating the lyne-hollick filter for baseflow separation based on catchment response time, J. Hydrol., 638, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2024.131483" ext-link-type="DOI">10.1016/j.jhydrol.2024.131483</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib41"><label>41</label><mixed-citation>Noor, K., Marttila, H., Welker, J. M., Mustonen, K.-R., Kløve, B., and Ala-aho, P.: Snow sampling strategy can bias estimation of meltwater fractions in isotope hydrograph separation, J. Hydrol., 627, 130429, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2023.130429" ext-link-type="DOI">10.1016/j.jhydrol.2023.130429</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib42"><label>42</label><mixed-citation>Pelletier, A. and Andréassian, V.: Hydrograph separation: an impartial parametrisation for an imperfect method, Hydrol. Earth Syst. Sci., 24, 1171–1187, <ext-link xlink:href="https://doi.org/10.5194/hess-24-1171-2020" ext-link-type="DOI">10.5194/hess-24-1171-2020</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib43"><label>43</label><mixed-citation>Piggott, A. R., Moin, S., and Southam, C.: A revised approach to the UKIH method for the calculation of baseflow  [Une approche améliorée de la méthode de l'UKIH pour le calcul de l'écoulement de base], Hydrolog. Sci. J., 50,  920, <ext-link xlink:href="https://doi.org/10.1623/hysj.2005.50.5.911" ext-link-type="DOI">10.1623/hysj.2005.50.5.911</ext-link>, 2005.</mixed-citation></ref>
      <ref id="bib1.bib44"><label>44</label><mixed-citation>Price, K.: Effects of watershed topography, soils, land use, and climate on baseflow hydrology in humid regions: A review, Prog. Phys. Geog., 35, 465–492, <ext-link xlink:href="https://doi.org/10.1177/0309133311402714" ext-link-type="DOI">10.1177/0309133311402714</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib45"><label>45</label><mixed-citation>Rudin, C.: Stop Explaining Black Box Machine Learning Models for High Stakes Decisions and Use Interpretable Models Instead, Nat. Mach. Intell., 1, 206–215, <ext-link xlink:href="https://doi.org/10.1038/s42256-019-0048-x" ext-link-type="DOI">10.1038/s42256-019-0048-x</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib46"><label>46</label><mixed-citation>Samaniego, L., Kumar, R., and Attinger, S.: Multiscale parameter regionalization of a grid-based hydrologic model at the mesoscale, Water Resour. Res., 46, <ext-link xlink:href="https://doi.org/10.1029/2008WR007327" ext-link-type="DOI">10.1029/2008WR007327</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib47"><label>47</label><mixed-citation> Sheta, A., Abdel-raouf, A., Fraihat, K., and Baareh, A. K.: Evolutionary Design of a PSO-Tuned Multigene Symbolic Regression Genetic Programming Model for River Flow Forecasting, International Journal of Advanced Computer Science and Applications, 14, 2023, 10.14569/IJACSA.2023.0140489, 2023.</mixed-citation></ref>
      <ref id="bib1.bib48"><label>48</label><mixed-citation>Sólyom, P. B. and Tucker, G. E.: The importance of the catchment area–length relationship in governing non-steady state hydrology, optimal junction angles and drainage network pattern, Geomorphology, 88, 84–108, <ext-link xlink:href="https://doi.org/10.1016/j.geomorph.2006.10.014" ext-link-type="DOI">10.1016/j.geomorph.2006.10.014</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib49"><label>49</label><mixed-citation>Song, W., Jiang, S., Camps-Valls, G., Williams, M., Zhang, L., Reichstein, M., Vereecken, H., He, L., Hu, X., and Shi, L.: Towards data-driven discovery of governing equations in geosciences, Commun. Earth Environ., 5, 589, <ext-link xlink:href="https://doi.org/10.1038/s43247-024-01760-6" ext-link-type="DOI">10.1038/s43247-024-01760-6</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib50"><label>50</label><mixed-citation>Stewart, M. K.: Promising new baseflow separation and recession analysis methods applied to streamflow at Glendhu Catchment, New Zealand, Hydrol. Earth Syst. Sci., 19, 2587–2603, <ext-link xlink:href="https://doi.org/10.5194/hess-19-2587-2015" ext-link-type="DOI">10.5194/hess-19-2587-2015</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib51"><label>51</label><mixed-citation>Stoelzle, M., Schuetz, T., Weiler, M., Stahl, K., and Tallaksen, L. M.: Beyond binary baseflow separation: a delayed-flow index for multiple streamflow contributions, Hydrol. Earth Syst. Sci., 24, 849–867, <ext-link xlink:href="https://doi.org/10.5194/hess-24-849-2020" ext-link-type="DOI">10.5194/hess-24-849-2020</ext-link>, 2020. </mixed-citation></ref>
      <ref id="bib1.bib52"><label>52</label><mixed-citation>Sundararajan, M. and Najmi, A.: The Many Shapley Values for Model Explanation, Proceedings of the 37th International Conference on Machine Learning, Proceedings of Machine Learning Research (PMLR), 119, <uri>https://proceedings.mlr.press/v119/sundararajan20b.html</uri> (last access: 29 May 2026), 2020.</mixed-citation></ref>
      <ref id="bib1.bib53"><label>53</label><mixed-citation>Tan, X., Liu, B., and Tan, X.: Global Changes in Baseflow Under the Impacts of Changing Climate and Vegetation, Water Resour. Res., 56, e2020WR027349, <ext-link xlink:href="https://doi.org/10.1029/2020WR027349" ext-link-type="DOI">10.1029/2020WR027349</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib54"><label>54</label><mixed-citation>Tarasova, L., Gnann, S., Yang, S., Hartmann, A., and Wagener, T.: Catchment characterization: Current descriptors, knowledge gaps and future opportunities, Earth-Sci. Rev., 252, <ext-link xlink:href="https://doi.org/10.1016/j.earscirev.2024.104739" ext-link-type="DOI">10.1016/j.earscirev.2024.104739</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib55"><label>55</label><mixed-citation>Thorslund, J. and van Vliet, M. T. H.: A global dataset of surface water and groundwater salinity measurements from 1980–2019, Scientific Data, 7, 231, <ext-link xlink:href="https://doi.org/10.1038/s41597-020-0562-z" ext-link-type="DOI">10.1038/s41597-020-0562-z</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib56"><label>56</label><mixed-citation>Wang, C., Gomez-Velez, J. D., and Wilson, J. L.: Dynamic coevolution of baseflow and multiscale groundwater flow system during prolonged droughts, J. Hydrol., 609, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2022.127657" ext-link-type="DOI">10.1016/j.jhydrol.2022.127657</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib57"><label>57</label><mixed-citation>Wilstrup, C. and Kasak, J.: Symbolic regression outperforms other models for small data sets, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2103.15147" ext-link-type="DOI">10.48550/arXiv.2103.15147</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib58"><label>58</label><mixed-citation>Wu, S., Zhao, J., Wang, H., and Sivapalan, M.: Regional Patterns and Physical Controls of Streamflow Generation Across the Conterminous United States, Water Resour. Res., 57, <ext-link xlink:href="https://doi.org/10.1029/2020wr028086" ext-link-type="DOI">10.1029/2020wr028086</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib59"><label>59</label><mixed-citation>Xie, J., Liu, X., Tian, W., Wang, K., Bai, P., and Liu, C.: Estimating Gridded Monthly Baseflow From 1981 to 2020 for the Contiguous US Using Long Short-Term Memory (LSTM) Networks, Water Resour. Res., 58, <ext-link xlink:href="https://doi.org/10.1029/2021wr031663" ext-link-type="DOI">10.1029/2021wr031663</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib60"><label>60</label><mixed-citation>Xie, J., Liu, X., Wang, K., Yang, T., Liang, K., and Liu, C.: Evaluation of typical methods for baseflow separation in the contiguous United States, J. Hydrol., 583, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2020.124628" ext-link-type="DOI">10.1016/j.jhydrol.2020.124628</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib61"><label>61</label><mixed-citation>Xie, J., Liu, X., Jasechko, S., Berghuijs, W. R., Wang, K., Liu, C., Reichstein, M., Jung, M., and Koirala, S.: Majority of global river flow sustained by groundwater, Nat. Geosci., <ext-link xlink:href="https://doi.org/10.1038/s41561-024-01483-5" ext-link-type="DOI">10.1038/s41561-024-01483-5</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib62"><label>62</label><mixed-citation>Yan, X., Sun, J., Huang, Y., Xia, Y., Wang, Z., and Li, Z.: Detecting and attributing the changes in baseflow in China's Loess Plateau, J. Hydrol., 617, 128957, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2022.128957" ext-link-type="DOI">10.1016/j.jhydrol.2022.128957</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib63"><label>63</label><mixed-citation>Zhang, J., Zhang, Y., Song, J., and Cheng, L.: Evaluating relative merits of four baseflow separation methods in Eastern Australia, J. Hydrol., 549, 252–263, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2017.04.004" ext-link-type="DOI">10.1016/j.jhydrol.2017.04.004</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib64"><label>64</label><mixed-citation>Zhang, J., Zhang, Y., Song, J., Cheng, L., Kumar Paul, P., Gan, R., Shi, X., Luo, Z., and Zhao, P.: Large-scale baseflow index prediction using hydrological modelling, linear and multilevel regression approaches, J. Hydrol., 585, 124780, <ext-link xlink:href="https://doi.org/10.1016/j.jhydrol.2020.124780" ext-link-type="DOI">10.1016/j.jhydrol.2020.124780</ext-link>, 2020.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>Symbolic regression-based regionalization of baseflow separation parameter using catchment-scale characteristics</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>1</label><mixed-citation>
      
Aksoy, H., Unal, N. E., and Pektas, A. O.: Smoothed minima baseflow
separation tool for perennial and intermittent streams, Hydrol.
Process., 22, 4467–4476, <a href="https://doi.org/10.1002/hyp.7077" target="_blank">https://doi.org/10.1002/hyp.7077</a>, 2008.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>2</label><mixed-citation>
      
Apley, D. W. and Zhu, J.: Visualizing the Effects of Predictor Variables in
Black Box Supervised Learning Models, J. Roy. Stat.
Soc. B, 82, 1059–1086,
10.1111/rssb.12377, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>3</label><mixed-citation>
      
Barnhart, T. B., Molotch, N. P., Livneh, B., Harpold, A. A., Knowles, J. F.,
and Schneider, D.: Snowmelt rate dictates streamflow, Geophys. Res.
Lett., 43, 8006–8016, <a href="https://doi.org/10.1002/2016GL069690" target="_blank">https://doi.org/10.1002/2016GL069690</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>4</label><mixed-citation>
      
Beven, K. and Germann, P.: Macropores and water flow in soils revisited,
Water Resour. Res., 49, 3071–3092, <a href="https://doi.org/10.1002/wrcr.20156" target="_blank">https://doi.org/10.1002/wrcr.20156</a>,
2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>5</label><mixed-citation>
      
Cartwright, I.: Implications of variations in stream specific conductivity for estimating baseflow using chemical mass balance and calibrated hydrograph techniques, Hydrol. Earth Syst. Sci., 26, 183–195, <a href="https://doi.org/10.5194/hess-26-183-2022" target="_blank">https://doi.org/10.5194/hess-26-183-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>6</label><mixed-citation>
      
Chadalawada, J., Herath, H. M. V. V., and Babovic, V.: Hydrologically
Informed Machine Learning for Rainfall-Runoff Modeling: A Genetic
Programming-Based Toolkit for Automatic Model Induction, Water Resour.
Res., 56, e2019WR026933, <a href="https://doi.org/10.1029/2019WR026933" target="_blank">https://doi.org/10.1029/2019WR026933</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>7</label><mixed-citation>
      
Cranmer, M.: Interpretable machine learning for science with PySR and
SymbolicRegression.jl, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2305.01582" target="_blank">https://doi.org/10.48550/arXiv.2305.01582</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>8</label><mixed-citation>
      
Diebold, F. X. and Mariano, R. S.: Comparing Predictive Accuracy, J.
Bus. Econ. Stat., 13, 253–263,
10.1080/07350015.1995.10524599, 1995.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>9</label><mixed-citation>
      
Elsken, T., Metzen, J. H., and Hutter, F.: Neural architecture search: a
survey, J. Mach. Learn. Res., 20, 1997–2017, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>10</label><mixed-citation>
      
Feigl, M., Herrnegger, M., Klotz, D., and Schulz, K.: Function Space
Optimization: A Symbolic Regression Method for Estimating Parameter Transfer
Functions for Hydrological Models, Water Resour. Res., 56, e2020WR027385,
10.1029/2020WR027385, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>11</label><mixed-citation>
      
Feigl, M., Thober, S., Schweppe, R., Herrnegger, M., Samaniego, L., and
Schulz, K.: Automatic Regionalization of Model Parameters for Hydrological
Models, Water Resour. Res., 58, e2022WR031966,
<a href="https://doi.org/10.1029/2022WR031966" target="_blank">https://doi.org/10.1029/2022WR031966</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>12</label><mixed-citation>
      
Feng, D., Fang, K., and Shen, C.: Enhancing Streamflow Forecast and
Extracting Insights Using Long-Short Term Memory Networks With Data
Integration at Continental Scales, Water Resour. Res., 56,
e2019WR026793, <a href="https://doi.org/10.1029/2019wr026793" target="_blank">https://doi.org/10.1029/2019wr026793</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>13</label><mixed-citation>
      
Garzon, L. F. L., Johnson, M. F., Mount, N., and Gomez, H.: Exploring the
effects of catchment morphometry on overland flow response to extreme
rainfall using a 2D hydraulic-hydrological model (IBER), J.
Hydrol., 627, 130405, <a href="https://doi.org/10.1016/j.jhydrol.2023.130405" target="_blank">https://doi.org/10.1016/j.jhydrol.2023.130405</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>14</label><mixed-citation>
      
Gnann, S. J., McMillan, H. K., Woods, R. A., and Howden, N. J. K.: Including
Regional Knowledge Improves Baseflow Signature Predictions in Large Sample
Hydrology, Water Resour. Res., 57, e2020WR028354,
<a href="https://doi.org/10.1029/2020WR028354" target="_blank">https://doi.org/10.1029/2020WR028354</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>15</label><mixed-citation>
      
Godsey, S. E., Kirchner, J. W., and Tague, C. L.: Effects of changes in
winter snowpacks on summer low flows: case studies in the Sierra Nevada,
California, USA, Hydrol. Process., 28, 5048–5064,
<a href="https://doi.org/10.1002/hyp.9943" target="_blank">https://doi.org/10.1002/hyp.9943</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>16</label><mixed-citation>
      
Gupta, H. V., Kling, H., Yilmaz, K. K., and Martinez, G. F.: Decomposition
of the mean squared error and NSE performance criteria: Implications for
improving hydrological modelling, J. Hydrol., 377, 80–91,
10.1016/j.jhydrol.2009.08.003, 2009.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>17</label><mixed-citation>
      
Gustard, A., Bullock, A. D., and Dixon, J. M.: Low Flow Estimation in the
United Kingdom, Institute of Hydrology, Wallingford, UK, ISBN&thinsp;0948540451, 1992.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>18</label><mixed-citation>
      
Häfner, D., Gemmrich, J., and Jochum, M.: Machine-guided discovery of a
real-world rogue wave model, P. Natl. Acad.
Sci. USA, 120, e2306275120, <a href="https://doi.org/10.1073/pnas.2306275120" target="_blank">https://doi.org/10.1073/pnas.2306275120</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>19</label><mixed-citation>
      
Hagedorn, B.: Hydrograph separation through multi objective optimization:
Revealing the importance of a temporally and spatially constrained baseflow
solute source, J. Hydrol., 590, 125349,
<a href="https://doi.org/10.1016/j.jhydrol.2020.125349" target="_blank">https://doi.org/10.1016/j.jhydrol.2020.125349</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>20</label><mixed-citation>
      
Hou, X., Xie, D., Feng, L., Shen, F., and Nienhuis, J. H.: Sustained
increase in suspended sediments near global river deltas over the past two
decades, Nat. Commun., 15, 3319, <a href="https://doi.org/10.1038/s41467-024-47598-6" target="_blank">https://doi.org/10.1038/s41467-024-47598-6</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>21</label><mixed-citation>
      
Humphrey, C. E., Solomon, D. K., Genereux, D. P., Gilmore, T. E.,
Mittelstet, A. R., Zlotnik, V. A., Zeyrek, C., Jensen, C. R., and MacNamara,
M. R.: Using Automated Seepage Meters to Quantify the Spatial Variability
and Net Flux of Groundwater to a Stream, Water Resour. Res., 58,
e2021WR030711, <a href="https://doi.org/10.1029/2021WR030711" target="_blank">https://doi.org/10.1029/2021WR030711</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>22</label><mixed-citation>
      
Jenicek, M. and Ledvinka, O.: Importance of snowmelt contribution to seasonal runoff and summer low flows in Czechia, Hydrol. Earth Syst. Sci., 24, 3475–3491, <a href="https://doi.org/10.5194/hess-24-3475-2020" target="_blank">https://doi.org/10.5194/hess-24-3475-2020</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>23</label><mixed-citation>
      
Karpatne, A., Jia, X., and Kumar, V.: Knowledge-guided machine learning:
Current trends and future prospects, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2403.15989" target="_blank">https://doi.org/10.48550/arXiv.2403.15989</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>24</label><mixed-citation>
      
Klotz, D., Herrnegger, M., and Schulz, K.: Symbolic Regression for the
Estimation of Transfer Functions of Hydrological Models, Water Resour.
Res., 53, 9402–9423, <a href="https://doi.org/10.1002/2017wr021253" target="_blank">https://doi.org/10.1002/2017wr021253</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>25</label><mixed-citation>
      
Koza, J. R.: Genetic programming as a means for programming computers by
natural selection, Stat. Comput., 4, 87–112, <a href="https://doi.org/10.1007/BF00175355" target="_blank">https://doi.org/10.1007/BF00175355</a>,
1994.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>26</label><mixed-citation>
      
Kratzert, F., Klotz, D., Shalev, G., Klambauer, G., Hochreiter, S., and Nearing, G.: Towards learning universal, regional, and local hydrological behaviors via machine learning applied to large-sample datasets, Hydrol. Earth Syst. Sci., 23, 5089–5110, <a href="https://doi.org/10.5194/hess-23-5089-2019" target="_blank">https://doi.org/10.5194/hess-23-5089-2019</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>27</label><mixed-citation>
      
Kronberger, G., de Franca, F. O., Burlacu, B., Haider, C., and Kommenda, M.:
Shape-Constrained Symbolic Regression – Improving Extrapolation with Prior
Knowledge, Evol. Comput., 30, 75–98, <a href="https://doi.org/10.1162/evco_a_00294" target="_blank">https://doi.org/10.1162/evco_a_00294</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>28</label><mixed-citation>
      
Li, Q., Zhang, C., Wei, Z., Jin, X., Shangguan, W., Yuan, H., Zhu, J., Li,
L., Liu, P., Chen, X., Yan, Y., and Dai, Y.: Advancing symbolic regression
for earth science with a focus on evapotranspiration modeling, npj Climate
and Atmospheric Science, 7, <a href="https://doi.org/10.1038/s41612-024-00861-5" target="_blank">https://doi.org/10.1038/s41612-024-00861-5</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>29</label><mixed-citation>
      
Li, X., Zhang, J., Li, D., Liu, X., Xu, J., and Yin, J.: UniSymNet: A
Unified Symbolic Network Guided by Transformer, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2505.06091" target="_blank">https://doi.org/10.48550/arXiv.2505.06091</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>30</label><mixed-citation>
      
Lin, Y., Mei, Y., and Wang, D.: Data and code archive for “Regionalization
of Optimal Baseflow Separation using Catchment-scale Characteristics”, Zenodo [data set/code], <a href="https://doi.org/10.5281/zenodo.16924118" target="_blank">https://doi.org/10.5281/zenodo.16924118</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>31</label><mixed-citation>
      
Lin, Y., Mei, Y., Wang, D., Zhu, J., Wu, H., Wang, S., Yin, G., Gao, L., and
N. Anagnostou, E.: Regionalization of Optimal Baseflow Separation using
Catchment-scale Characteristics, Water Resour. Res., 62, <a href="https://doi.org/10.1029/2025WR040578" target="_blank">https://doi.org/10.1029/2025WR040578</a>, 2026.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>32</label><mixed-citation>
      
Makke, N. and Chawla, S.: Interpretable scientific discovery with symbolic
regression: a review, Artif. Intell. Rev., 57,
<a href="https://doi.org/10.1007/s10462-023-10622-0" target="_blank">https://doi.org/10.1007/s10462-023-10622-0</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>33</label><mixed-citation>
      
McGlynn, B. L., McDonnell, J. J., Seibert, J., and Kendall, C.: Scale
effects on headwater catchment runoff timing, flow sources, and
groundwater-streamflow relations, Water Resour. Res., 40,
<a href="https://doi.org/10.1029/2003WR002494" target="_blank">https://doi.org/10.1029/2003WR002494</a>, 2004.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>34</label><mixed-citation>
      
McMahon, T. A. and Nathan, R. J.: Baseflow and transmission loss: A review,
WIREs Water, 8, e1527, <a href="https://doi.org/10.1002/wat2.1527" target="_blank">https://doi.org/10.1002/wat2.1527</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>35</label><mixed-citation>
      
McMillan, H.: Linking hydrologic signatures to hydrologic processes: A
review, Hydrol. Process., 34, 1393–1409,
<a href="https://doi.org/10.1002/hyp.13632" target="_blank">https://doi.org/10.1002/hyp.13632</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>36</label><mixed-citation>
      
McMillan, H. K., Gnann, S. J., and Araki, R.: Large Scale Evaluation of
Relationships Between Hydrologic Signatures and Processes, Water Resour.
Res., 58, e2021WR031751, <a href="https://doi.org/10.1029/2021WR031751" target="_blank">https://doi.org/10.1029/2021WR031751</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>37</label><mixed-citation>
      
Mei, Y. and Anagnostou, E. N.: A hydrograph separation method based on
information from rainfall and runoff records, J. Hydrol., 523,
636–649, <a href="https://doi.org/10.1016/j.jhydrol.2015.01.083" target="_blank">https://doi.org/10.1016/j.jhydrol.2015.01.083</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>38</label><mixed-citation>
      
Mei, Y., Zhu, J., and Wang, D.: Data and Code Archive for “Optimal Baseflow
Separation through Chemical Mass Balance: Comparing the Usages of Two
Tracers, Two Concentration Estimation Methods, and Four Baseflow Filters”, Zenodo [data set/code], <a href="https://doi.org/10.5281/zenodo.8388365" target="_blank">https://doi.org/10.5281/zenodo.8388365</a>, 2024a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>39</label><mixed-citation>
      
Mei, Y., Wang, D., Zhu, J., Tang, G., Cai, C., Shen, X., Hong, Y., and
Zhang, X.: Optimal Baseflow Separation Through Chemical Mass Balance:
Comparing the Usages of Two Tracers, Two Concentration Estimation Methods,
and Four Baseflow Filters, Water Resour. Res., 60,
<a href="https://doi.org/10.1029/2023wr036386" target="_blank">https://doi.org/10.1029/2023wr036386</a>, 2024b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>40</label><mixed-citation>
      
Nagy, E. D., Szilagyi, J., and Torma, P.: Calibrating the lyne-hollick
filter for baseflow separation based on catchment response time, J.
Hydrol., 638, <a href="https://doi.org/10.1016/j.jhydrol.2024.131483" target="_blank">https://doi.org/10.1016/j.jhydrol.2024.131483</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>41</label><mixed-citation>
      
Noor, K., Marttila, H., Welker, J. M., Mustonen, K.-R., Kløve, B., and
Ala-aho, P.: Snow sampling strategy can bias estimation of meltwater
fractions in isotope hydrograph separation, J. Hydrol., 627,
130429, <a href="https://doi.org/10.1016/j.jhydrol.2023.130429" target="_blank">https://doi.org/10.1016/j.jhydrol.2023.130429</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>42</label><mixed-citation>
      
Pelletier, A. and Andréassian, V.: Hydrograph separation: an impartial parametrisation for an imperfect method, Hydrol. Earth Syst. Sci., 24, 1171–1187, <a href="https://doi.org/10.5194/hess-24-1171-2020" target="_blank">https://doi.org/10.5194/hess-24-1171-2020</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>43</label><mixed-citation>
      
Piggott, A. R., Moin, S., and Southam, C.: A revised approach to the UKIH
method for the calculation of baseflow  [Une approche améliorée de
la méthode de l'UKIH pour le calcul de l'écoulement de base],
Hydrolog. Sci. J., 50,  920, <a href="https://doi.org/10.1623/hysj.2005.50.5.911" target="_blank">https://doi.org/10.1623/hysj.2005.50.5.911</a>,
2005.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>44</label><mixed-citation>
      
Price, K.: Effects of watershed topography, soils, land use, and climate on
baseflow hydrology in humid regions: A review, Prog. Phys.
Geog., 35, 465–492, <a href="https://doi.org/10.1177/0309133311402714" target="_blank">https://doi.org/10.1177/0309133311402714</a>,
2011.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>45</label><mixed-citation>
      
Rudin, C.: Stop Explaining Black Box Machine Learning Models for High Stakes
Decisions and Use Interpretable Models Instead, Nat. Mach. Intell., 1, 206–215,
<a href="https://doi.org/10.1038/s42256-019-0048-x" target="_blank">https://doi.org/10.1038/s42256-019-0048-x</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>46</label><mixed-citation>
      
Samaniego, L., Kumar, R., and Attinger, S.: Multiscale parameter
regionalization of a grid-based hydrologic model at the mesoscale, Water
Resour. Res., 46, <a href="https://doi.org/10.1029/2008WR007327" target="_blank">https://doi.org/10.1029/2008WR007327</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>47</label><mixed-citation>
      
Sheta, A., Abdel-raouf, A., Fraihat, K., and Baareh, A. K.: Evolutionary
Design of a PSO-Tuned Multigene Symbolic Regression Genetic Programming
Model for River Flow Forecasting, International Journal of Advanced Computer
Science and Applications, 14, 2023, 10.14569/IJACSA.2023.0140489, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>48</label><mixed-citation>
      
Sólyom, P. B. and Tucker, G. E.: The importance of the catchment
area–length relationship in governing non-steady state hydrology, optimal
junction angles and drainage network pattern, Geomorphology, 88, 84–108,
<a href="https://doi.org/10.1016/j.geomorph.2006.10.014" target="_blank">https://doi.org/10.1016/j.geomorph.2006.10.014</a>, 2007.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>49</label><mixed-citation>
      
Song, W., Jiang, S., Camps-Valls, G., Williams, M., Zhang, L., Reichstein,
M., Vereecken, H., He, L., Hu, X., and Shi, L.: Towards data-driven
discovery of governing equations in geosciences, Commun. Earth Environ., 5, 589, <a href="https://doi.org/10.1038/s43247-024-01760-6" target="_blank">https://doi.org/10.1038/s43247-024-01760-6</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>50</label><mixed-citation>
      
Stewart, M. K.: Promising new baseflow separation and recession analysis methods applied to streamflow at Glendhu Catchment, New Zealand, Hydrol. Earth Syst. Sci., 19, 2587–2603, <a href="https://doi.org/10.5194/hess-19-2587-2015" target="_blank">https://doi.org/10.5194/hess-19-2587-2015</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>51</label><mixed-citation>
      
Stoelzle, M., Schuetz, T., Weiler, M., Stahl, K., and Tallaksen, L. M.: Beyond binary baseflow separation: a delayed-flow index for multiple streamflow contributions, Hydrol. Earth Syst. Sci., 24, 849–867, <a href="https://doi.org/10.5194/hess-24-849-2020" target="_blank">https://doi.org/10.5194/hess-24-849-2020</a>, 2020.


    </mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>52</label><mixed-citation>
      
Sundararajan, M. and Najmi, A.: The Many Shapley Values for Model
Explanation, Proceedings of the 37th International Conference on Machine
Learning, Proceedings of Machine Learning Research (PMLR), 119, <a href="https://proceedings.mlr.press/v119/sundararajan20b.html" target="_blank"/> (last access: 29 May 2026), 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>53</label><mixed-citation>
      
Tan, X., Liu, B., and Tan, X.: Global Changes in Baseflow Under the Impacts
of Changing Climate and Vegetation, Water Resour. Res., 56,
e2020WR027349, <a href="https://doi.org/10.1029/2020WR027349" target="_blank">https://doi.org/10.1029/2020WR027349</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>54</label><mixed-citation>
      
Tarasova, L., Gnann, S., Yang, S., Hartmann, A., and Wagener, T.: Catchment
characterization: Current descriptors, knowledge gaps and future
opportunities, Earth-Sci. Rev., 252, <a href="https://doi.org/10.1016/j.earscirev.2024.104739" target="_blank">https://doi.org/10.1016/j.earscirev.2024.104739</a>,
2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>55</label><mixed-citation>
      
Thorslund, J. and van Vliet, M. T. H.: A global dataset of surface water and
groundwater salinity measurements from 1980–2019, Scientific Data, 7, 231,
<a href="https://doi.org/10.1038/s41597-020-0562-z" target="_blank">https://doi.org/10.1038/s41597-020-0562-z</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>56</label><mixed-citation>
      
Wang, C., Gomez-Velez, J. D., and Wilson, J. L.: Dynamic coevolution of
baseflow and multiscale groundwater flow system during prolonged droughts,
J. Hydrol., 609, <a href="https://doi.org/10.1016/j.jhydrol.2022.127657" target="_blank">https://doi.org/10.1016/j.jhydrol.2022.127657</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>57</label><mixed-citation>
      
Wilstrup, C. and Kasak, J.: Symbolic regression outperforms other models for
small data sets, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2103.15147" target="_blank">https://doi.org/10.48550/arXiv.2103.15147</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>58</label><mixed-citation>
      
Wu, S., Zhao, J., Wang, H., and Sivapalan, M.: Regional Patterns and
Physical Controls of Streamflow Generation Across the Conterminous United
States, Water Resour. Res., 57, <a href="https://doi.org/10.1029/2020wr028086" target="_blank">https://doi.org/10.1029/2020wr028086</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>59</label><mixed-citation>
      
Xie, J., Liu, X., Tian, W., Wang, K., Bai, P., and Liu, C.: Estimating
Gridded Monthly Baseflow From 1981 to 2020 for the Contiguous US Using Long
Short-Term Memory (LSTM) Networks, Water Resour. Res., 58,
<a href="https://doi.org/10.1029/2021wr031663" target="_blank">https://doi.org/10.1029/2021wr031663</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>60</label><mixed-citation>
      
Xie, J., Liu, X., Wang, K., Yang, T., Liang, K., and Liu, C.: Evaluation of
typical methods for baseflow separation in the contiguous United States,
J. Hydrol., 583, <a href="https://doi.org/10.1016/j.jhydrol.2020.124628" target="_blank">https://doi.org/10.1016/j.jhydrol.2020.124628</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>61</label><mixed-citation>
      
Xie, J., Liu, X., Jasechko, S., Berghuijs, W. R., Wang, K., Liu, C.,
Reichstein, M., Jung, M., and Koirala, S.: Majority of global river flow
sustained by groundwater, Nat. Geosci., <a href="https://doi.org/10.1038/s41561-024-01483-5" target="_blank">https://doi.org/10.1038/s41561-024-01483-5</a>,
2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>62</label><mixed-citation>
      
Yan, X., Sun, J., Huang, Y., Xia, Y., Wang, Z., and Li, Z.: Detecting and
attributing the changes in baseflow in China's Loess Plateau, J.
Hydrol., 617, 128957, <a href="https://doi.org/10.1016/j.jhydrol.2022.128957" target="_blank">https://doi.org/10.1016/j.jhydrol.2022.128957</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>63</label><mixed-citation>
      
Zhang, J., Zhang, Y., Song, J., and Cheng, L.: Evaluating relative merits of
four baseflow separation methods in Eastern Australia, J. Hydrol.,
549, 252–263, <a href="https://doi.org/10.1016/j.jhydrol.2017.04.004" target="_blank">https://doi.org/10.1016/j.jhydrol.2017.04.004</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>64</label><mixed-citation>
      
Zhang, J., Zhang, Y., Song, J., Cheng, L., Kumar Paul, P., Gan, R., Shi, X.,
Luo, Z., and Zhao, P.: Large-scale baseflow index prediction using
hydrological modelling, linear and multilevel regression approaches, J.
Hydrol., 585, 124780, <a href="https://doi.org/10.1016/j.jhydrol.2020.124780" target="_blank">https://doi.org/10.1016/j.jhydrol.2020.124780</a>,
2020.

    </mixed-citation></ref-html>--></article>
