<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="data-paper">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">ESSD</journal-id><journal-title-group>
    <journal-title>Earth System Science Data</journal-title>
    <abbrev-journal-title abbrev-type="publisher">ESSD</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Earth Syst. Sci. Data</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1866-3516</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/essd-17-43-2025</article-id><title-group><article-title>A machine-learning reconstruction of sea surface <inline-formula><mml:math id="M1" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the North American Atlantic Coastal Ocean Margin from 1993 to 2021</article-title><alt-title>A machine-learning reconstruction of coastal surface <inline-formula><mml:math id="M3" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub></alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff2">
          <name><surname>Wu</surname><given-names>Zelun</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-9480-2738</ext-link></contrib>
        <contrib contrib-type="author" corresp="yes" rid="aff3">
          <name><surname>Lu</surname><given-names>Wenfang</given-names></name>
          <email>luwf6@sysu.edu.cn</email>
        <ext-link>https://orcid.org/0000-0003-1303-9820</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4">
          <name><surname>Roobaert</surname><given-names>Alizée</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-4168-5494</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5">
          <name><surname>Song</surname><given-names>Luping</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Yan</surname><given-names>Xiao-Hai</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Cai</surname><given-names>Wei-Jun</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-3606-8325</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>State Key Laboratory of Marine Environmental Science &amp; College of Ocean and Earth Science, Xiamen University, Xiamen, Fujian, 361102, China</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>School of Marine Science and Policy, University of Delaware, Newark, Delaware 19716, USA</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>School of Marine Sciences, State Key Laboratory of Environmental Adaptability for Industrial Products, Sun Yat-sen University, Zhuhai, Guangdong, 519082, China</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>Flanders Marine Institute (VLIZ), Jacobsenstraat 1, Ostend, 8400, Belgium</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>School of Marine Science and Technology, Zhejiang Ocean University, Zhoushan, Zhejiang, 316022, China</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Wenfang Lu (luwf6@sysu.edu.cn)</corresp></author-notes><pub-date><day>8</day><month>January</month><year>2025</year></pub-date>
      
      <volume>17</volume>
      <issue>1</issue>
      <fpage>43</fpage><lpage>63</lpage>
      <history>
        <date date-type="received"><day>21</day><month>July</month><year>2024</year></date>
           <date date-type="rev-request"><day>19</day><month>August</month><year>2024</year></date>
           <date date-type="rev-recd"><day>2</day><month>November</month><year>2024</year></date>
           <date date-type="accepted"><day>11</day><month>November</month><year>2024</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2025 Zelun Wu et al.</copyright-statement>
        <copyright-year>2025</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025.html">This article is available from https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025.html</self-uri><self-uri xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025.pdf">The full text article is available as a PDF file from https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e188">Insufficient spatiotemporal coverage of observations of the surface partial pressure of CO<sub>2</sub> (<inline-formula><mml:math id="M6" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>) has hindered precise carbon cycle studies in coastal oceans and justifies the development of spatially and temporally continuous <inline-formula><mml:math id="M8" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data products. Earlier <inline-formula><mml:math id="M10" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products have difficulties in capturing the heterogeneity of regional variations and decadal trends of <inline-formula><mml:math id="M12" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the North American Atlantic Coastal Ocean Margin (NAACOM). This study developed a regional reconstructed <inline-formula><mml:math id="M14" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product for the NAACOM (Reconstructed Coastal Acidification Database-<inline-formula><mml:math id="M16" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, or ReCAD-NAACOM-<inline-formula><mml:math id="M18" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>) using a two-step approach combining random forest regression and linear regression. The product provides monthly <inline-formula><mml:math id="M20" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data at 0.25° spatial resolution from 1993 to 2021, enabling investigation of regional spatial differences, seasonal cycles, and decadal changes in <inline-formula><mml:math id="M22" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. The observation-based reconstruction was trained using Surface Ocean CO<sub>2</sub> Atlas (SOCAT) observations as observational values, with various satellite-derived and reanalysis environmental variables known to control sea surface <inline-formula><mml:math id="M25" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> as model inputs. The product shows high accuracy during the model training, validation, and independent test phases, demonstrating robustness and a capability to accurately reconstruct <inline-formula><mml:math id="M27" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in regions or periods lacking direct observational data. Compared with all the observation samples from SOCAT, the <inline-formula><mml:math id="M29" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product yields a determination coefficient of 0.92, a root-mean-square error of 12.70 <inline-formula><mml:math id="M31" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, and an accumulative uncertainty of 23.25 <inline-formula><mml:math id="M32" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm. The ReCAD-NAACOM-<inline-formula><mml:math id="M33" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product demonstrates its capability to resolve seasonal cycles, regional-scale variations, and decadal trends of <inline-formula><mml:math id="M35" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> along the NAACOM. This new product provides reliable <inline-formula><mml:math id="M37" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data for more precise studies of coastal carbon dynamics in the NAACOM region. The dataset is publicly accessible at <uri>https://doi.org/10.5281/zenodo.14038561</uri> (Wu et al., 2024a) and will be updated regularly.</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>Southern Marine Science and Engineering Guangdong Laboratory (Guangzhou)</funding-source>
<award-id>SML2023SP238</award-id>
</award-group>
<award-group id="gs2">
<funding-source>Xiamen University</funding-source>
<award-id>n/a</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e482">Accurate and comprehensive datasets of the sea surface partial pressure of CO<sub>2</sub> (<inline-formula><mml:math id="M40" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>) are necessary for quantifying coastal CO<sub>2</sub> uptake and assessing the impact of climate change on coastal ocean ecosystems. On a global scale, the coastal ocean, covering 8.4 % (30.4 <inline-formula><mml:math id="M43" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 10<sup>6</sup> km<sup>2</sup>) of the global ocean surface area (Chen et al., 2013; Dai et al., 2022), plays a significant role in the global carbon budget, accounting for approximately 10.9 % of the global ocean CO<sub>2</sub> uptake from the atmosphere (0.25 of 2.3 Pg C yr<sup>−1</sup>) on the global average (Dai et al., 2022; Friedlingstein et al., 2023). However, on regional scales, areal-based CO<sub>2</sub> uptake in specific coastal regions are often much greater than those in open oceans despite their less distinguishable global means (Dai et al., 2022). This is because sea surface <inline-formula><mml:math id="M49" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> is highly variable due to the influence of various physical and biogeochemical processes in coastal oceans, such as riverine input, upwelling, tidal mixing, and large-scale circulations (Laruelle et al., 2018; Roobaert et al., 2024b). Thus, accurately quantifying the CO<sub>2</sub> uptake in specific coastal regions becomes particularly challenging when only using observations due to the incomplete coverage of <inline-formula><mml:math id="M52" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data in space and time.</p>
      <p id="d2e617">This study focuses on the North American Atlantic Coastal Ocean Margin (NAACOM; Fig. 1). The entire region is defined as the area within 400 km of the coastline and is divided into six subregions following Fennel et al. (2019) based on their geographic locations: the Gulf of Mexico (GoMx), South Atlantic Bight (SAB), Mid-Atlantic Bight (MAB), Gulf of Maine (GoMe), Scotian Shelf (SS), and Gulf of St. Lawrence and Grand Banks (GStL&amp;GB). The carbonate system in the NAACOM is influenced by large-scale circulations (Fig. 1), including the Gulf Stream and Labrador Current, as well as local processes like river discharge, export from marshes, and upwelling dynamics (Cai et al., 2020; Fennel et al., 2019; Wang et al., 2013). These complex physical and biogeochemical processes contribute to substantial spatial and temporal heterogeneity in sea surface <inline-formula><mml:math id="M54" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the NAACOM (Cai et al., 2020). Elucidating the driving mechanisms of these spatiotemporal <inline-formula><mml:math id="M56" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variations necessitates extensive data coverage in time and space in this region. Over the past 2 decades, coastal field investigation efforts in this region have substantially increased through programs like the East Coast Ocean Acidification (ECOA) and Gulf of Mexico Ecosystems and Carbon Cruise (GOMECC) (Cai et al., 2020; Wang et al., 2013; Wanninkhof et al., 2015). Ongoing measurements from these cruises, combined with ongoing measurements from volunteer observing ships and buoys, are quality-controlled and compiled in the Surface Ocean CO<sub>2</sub> Atlas (SOCAT) database (Bakker et al., 2016), substantially advancing our understanding of coastal inorganic carbon chemistry along the NAACOM (Cai et al., 2020).</p>
      <p id="d2e661">Despite significant progress in observational efforts, the spatial and temporal coverage of <inline-formula><mml:math id="M59" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data remains limited in the NAACOM, with observations encompassing only 2.9 % of grid cells during the period 1993–2021 (Fig. 2). Observations are concentrated in the southern region, with fewer samples available during winter. This data scarcity introduces substantial uncertainty into air–sea CO<sub>2</sub> exchange quantification and hinders comprehensive understanding of coastal inorganic carbon dynamics, particularly in areas north of Cape Cod where measurements are very sparse (Fig. 2). For example, reported air–sea CO<sub>2</sub> fluxes for the GoMe exhibit a wide range spanning from <inline-formula><mml:math id="M63" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.50</mml:mn></mml:mrow></mml:math></inline-formula> to <inline-formula><mml:math id="M64" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.50</mml:mn></mml:mrow></mml:math></inline-formula> mol C m<sup>−2</sup> yr<sup>−1</sup>, with conflicting reports characterizing it as a CO<sub>2</sub> source (Fennel and Wilkin, 2009; Vandemark et al., 2011), CO<sub>2</sub>-neutral (Signorini et al., 2013), or a CO<sub>2</sub> sink (Cahill et al., 2016; Rutherford et al., 2021), underscoring the need for improved <inline-formula><mml:math id="M70" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data coverage.</p>

      <fig id="Ch1.F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e791">Topography (m) and large-scale circulation along the North American Atlantic Coastal Ocean Margin (NAACOM). The study region, defined as coastal areas extending 400 km offshore, is indicated by blue shading. The thick black line is the 200 m isobath, which roughly marks the shelf break and typically defines the continental shelf boundary. The Gulf Stream (thick red dashed line with an arrow) flows northward along the eastern coast of the United States before veering eastward into the open Atlantic Ocean around Cape Hatteras. The Labrador Current (thick light-blue dashed line with an arrow) flows southward along the eastern coast of Canada before meeting the Gulf Stream. Following Fennel et al. (2019), the study region is divided into six subregions by straight orange lines: the Gulf of Mexico (GoMx), South Atlantic Bight (SAB), Mid-Atlantic Bight (MAB), Gulf of Maine (GoMe), Scotian Shelf (SS), and Gulf of St. Lawrence and Grand Banks (GStL&amp;GB). Dashed contour lines indicate bathymetric depths of 50 and 100 m on the shelf (from the coastline to the 200 m isobath) and 1000, 2000, 3000, and 4000 m from the shelf break to the open ocean.</p></caption>
        <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f01.png"/>

      </fig>

      <p id="d2e800">Recently, various <inline-formula><mml:math id="M72" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products, global or regional, with full coverage in time and space were developed as essential supplements to observations. These products usually employed diverse algorithms, environmental proxies from satellites and reanalysis products as model inputs, and SOCAT observations as constraints to reconstruct the <inline-formula><mml:math id="M74" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> field with full temporal and spatial coverage. The development of those products has significantly advanced our understanding of inorganic carbon chemistry and the ocean carbon cycle. For example, seven global <inline-formula><mml:math id="M76" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products were used to evaluate the ocean CO<sub>2</sub> uptake in the Global Carbon Budget 2023 edition (Friedlingstein et al., 2023). However, most of these products reconstruct <inline-formula><mml:math id="M79" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the open ocean, with coastal regions often being extrapolated or excluded. Currently, only one <inline-formula><mml:math id="M81" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product has been developed specifically for the coastal ocean on a global scale (Laruelle et al., 2017; Roobaert et al., 2024a). This product was recently combined with an open-ocean product to create a global reconstruction of the ocean CO<sub>2</sub> sink (Landschützer et al., 2020) and has since been utilized to narrow the variability in global reconstructions (Fay et al., 2021). However, global products primarily aim to ensure high accuracy of parameters on a global average; they may not guarantee equivalent accuracy for spatiotemporal variations on the regional scale. In comparison, regional <inline-formula><mml:math id="M84" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products have demonstrated superior capability in resolving detailed small-scale variations.</p>
      <p id="d2e919">Within the NAACOM region, several area-specific <inline-formula><mml:math id="M86" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products have been reconstructed, focusing on specific regions such as the GoMx (e.g., Chen and Hu, 2019; Fu et al., 2020; Lohrenz and Cai, 2006) and the SAB and MAB (e.g., Wang et al., 2024; Xu et al., 2020). These regional and global <inline-formula><mml:math id="M88" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products are valuable for validating model estimations (Roobaert et al., 2022; Ross et al., 2023). However, existing products often have limitations in spatial coverage, temporal resolution, or trend analysis capabilities. For instance, Chen and Hu (2019) provided a high-resolution (4 km) <inline-formula><mml:math id="M90" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product for the GoMx, but this product faces challenges in capturing decadal changes in <inline-formula><mml:math id="M92" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (Wu et al., 2024b). Conversely, Xu et al. (2020) successfully captured decadal trends of <inline-formula><mml:math id="M94" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> but only as area-averaged <inline-formula><mml:math id="M96" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> time series for the SAB and MAB, lacking comprehensive spatial coverage. Signorini et al. (2013) reconstructed a product using multiple linear regression (MLR) covering the areas from the SAB to SS, but this only spans 8 years (2003–2010). Despite these valuable efforts, there remains a lack of comprehensive data products that adequately capture regional variations, seasonal cycles, and decadal changes in <inline-formula><mml:math id="M98" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> simultaneously for the entire NAACOM.</p>
      <p id="d2e1036">This study aims to develop a regional <inline-formula><mml:math id="M100" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product specifically designed for the NAACOM, encompassing coastal regions extending 400 km offshore from the GoMx to the GB (Fig. 1). We integrated random forest and linear regression methods with hydrological parameters from satellite observations and reanalysis data to generate a monthly reconstructed <inline-formula><mml:math id="M102" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product at 0.25° spatial resolution spanning the period from 1993 to 2021. The <inline-formula><mml:math id="M104" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product, termed the Reconstructed Coastal Acidification Database or ReCAD-NAACOM-<inline-formula><mml:math id="M106" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, is specifically designed to resolve the spatial variations, seasonal cycles, and decadal changes of <inline-formula><mml:math id="M108" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> along the NAACOM.</p>
      <p id="d2e1120">The structure of this paper is as follows: Sect. 2 details the methodology used to reconstruct ReCAD-NAACOM-<inline-formula><mml:math id="M110" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and describes the datasets employed. Section 3 evaluates the accuracy of the reconstructed product, performance, and applicability in resolving seasonal cycles, regional variations, and decadal trends of <inline-formula><mml:math id="M112" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. Sections 4 and 5 provide links to access the dataset and codes used to generate the dataset and figures presented in this study. The final section summarizes the conclusions. ReCAD-NAACOM-<inline-formula><mml:math id="M114" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> demonstrates enhanced capability in resolving spatial variations and capturing the seasonal cycle and decadal trends of <inline-formula><mml:math id="M116" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> compared to the global products across different subregions in the NAACOM. This product offers improved insights into coastal carbon dynamics in this complex region, addressing the need for a comprehensive <inline-formula><mml:math id="M118" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> dataset in the NAACOM. Applications of this data product to examine the processes controlling the spatial variability, seasonal cycle, and decadal trends of <inline-formula><mml:math id="M120" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and air–sea CO<sub>2</sub> flux will be published separately.</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Data and methods</title>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Observational data from SOCAT</title>
      <p id="d2e1245">The observational data for training the regression model were measurements of the seawater fugacity of CO<sub>2</sub> (<inline-formula><mml:math id="M124" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub>) extracted from the SOCAT database (2023 edition). <inline-formula><mml:math id="M126" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> represents the <inline-formula><mml:math id="M128" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> corrected for the nonideal behavior of the gas in seawater, and both are commonly used in oceanographic studies. SOCAT compiles quality-controlled <inline-formula><mml:math id="M130" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> measurements from various platforms, including research vessels, commercial ships, and moorings (Bakker et al., 2016). This study used the monthly gridded SOCAT coastal product with a spatial resolution of 0.25° <inline-formula><mml:math id="M132" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.25° (but with data gaps). The gridded product incorporated measurements with quality flags A and B (uncertainty of 2 <inline-formula><mml:math id="M133" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) and C and D (uncertainty of 5 <inline-formula><mml:math id="M134" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) (Bakker et al., 2016). Over the period of 1993–2021, the SOCAT product encompassed 55 347 grid cells within our study area (Fig. 2), accounting for approximately 2.9 % of the total number of grid cells in the NAACOM. The observational data show a lower sampling density in the areas north of Cape Cod and the western and southern GoMx (blue box in Fig. 2). The temporal distribution of the samples exhibits a notable bias, with reduced collection during winter (Fig. 2d). Despite these spatial and temporal heterogeneities, the SOCAT observations provide coverage across all subregions and seasons of the NAACOM (Fig. 2). This comprehensive, albeit sparse, coverage facilitates the reconstruction of the <inline-formula><mml:math id="M135" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and <inline-formula><mml:math id="M137" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> field through interpolation and regression techniques.</p>

      <fig id="Ch1.F2" specific-use="star"><label>Figure 2</label><caption><p id="d2e1380">Spatial distribution of sea surface <inline-formula><mml:math id="M139" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> observations from the SOCAT database (2023 edition) in the NAACOM across the four seasons from 1993 to 2021. Grid samples with data were counted by season: <bold>(a)</bold> spring (March to May), <bold>(b)</bold> summer (June to August), <bold>(c)</bold> fall (September to November), and <bold>(d)</bold> winter (December to February). The study region is divided into northern (blue box) and southern (red box) areas at approximately 41.5° N (Cape Cod). The number and percentage of the grid samples are indicated for each region by season. The color scale represents <inline-formula><mml:math id="M141" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values (<inline-formula><mml:math id="M143" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm). A higher sampling density is evident in the southern area. Winter shows the lowest overall sampling coverage. Note that the SOCAT database provides quality-controlled <inline-formula><mml:math id="M144" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> measurements as the default parameters, which are subsequently converted into <inline-formula><mml:math id="M146" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> using Eq. (2).</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f02.png"/>

        </fig>

</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>Model design</title>
      <p id="d2e1483">The procedures for developing and reconstructing the <inline-formula><mml:math id="M148" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product are illustrated in Fig. 3. Initially, the input variables and sea surface <inline-formula><mml:math id="M150" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data were matched to create a comprehensive dataset. To maintain consistency with the SOCAT database, which reports seawater CO<sub>2</sub> concentrations as <inline-formula><mml:math id="M153" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, we adopted <inline-formula><mml:math id="M155" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> as the model training label and first-step output variable in our model. During the model development phase, <inline-formula><mml:math id="M157" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> measurements served as training labels for the machine-learning algorithm. The matched dataset was then divided into two sets: X1, encompassing the periods 1993–2003 and 2006–2021, and X2, covering 2004–2005. Set X1 was randomly subdivided further, with 80 % allocated for model training and the remaining 20 % for the validation test. Set X2 served as an independent test set. The model training set (80 % of X1) was used to develop a two-step RFR–LR (random forest regression–linear regression) model. The RFR model is designed to capture complex, nonlinear relationships between the input variables and the target variable (i.e., <inline-formula><mml:math id="M159" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub>), while the LR model is subsequently applied to mitigate potential systematic biases in RFR-derived <inline-formula><mml:math id="M161" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values arising from spatiotemporal heterogeneities in the SOCAT observational dataset (Fig. 2). RFR, an ensemble learning technique, combines multiple decision trees to produce more accurate and stable predictions (Breiman, 2001; Lu et al., 2019). Each decision tree in the RFR model is trained on a randomly selected subset of the input data, with the final prediction derived from the average output of all the trees. This approach mitigates overfitting and enhances the generalization performance of the model, making it particularly suitable for large datasets with complex, nonlinear variable relationships. The RFR model was trained using 10-fold cross-validation with optimized hyperparameters, including a minimum leaf size of 1, a bagging method for ensemble aggregation, and 300 learning cycles after tuning. After RFR model training, the LR model was applied to the RFR-estimated <inline-formula><mml:math id="M163" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M165" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2est</sub>) output to make sure that the RFR model was not systematically biased:
            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M167" display="block"><mml:mrow><mml:mi>f</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi mathvariant="normal">obs</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mi>a</mml:mi><mml:mo>×</mml:mo><mml:mi>f</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi mathvariant="normal">est</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>b</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="italic">ε</mml:mi><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M168" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2obs</sub> is the observed <inline-formula><mml:math id="M170" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> from SOCAT, <inline-formula><mml:math id="M172" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> is the linear regression coefficient, <inline-formula><mml:math id="M173" display="inline"><mml:mi>b</mml:mi></mml:math></inline-formula> is the intercept, and <inline-formula><mml:math id="M174" display="inline"><mml:mi mathvariant="italic">ε</mml:mi></mml:math></inline-formula> is the residual that the linear model cannot resolve. This additional step was implemented to mitigate potential systematic bias in the RFR model that could arise from areas with a higher sampling density, thereby ensuring a more balanced representation across the entire study region. The comparison between the estimated <inline-formula><mml:math id="M175" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> before and after LR calibration is presented in Appendix A. The calibration was applied to each grid cell individually. To increase the data pool for linear regression, samples within a 5 <inline-formula><mml:math id="M177" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 5 grid window in space (i.e., 1.25° <inline-formula><mml:math id="M178" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1.25°) were aggregated for LR model development. As the available measurements could not cover every grid cell and were insufficient to produce continuous spatial maps of the calibration coefficients (i.e., <inline-formula><mml:math id="M179" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M180" display="inline"><mml:mi>b</mml:mi></mml:math></inline-formula> in Eq. 1), we employed a locally interpolated regression strategy similar to that of Carter et al. (2018). Mathematically, given the spatial and temporal continuity of <inline-formula><mml:math id="M181" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2est</sub> and <inline-formula><mml:math id="M183" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2obs</sub>, the coefficients <inline-formula><mml:math id="M185" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M186" display="inline"><mml:mi>b</mml:mi></mml:math></inline-formula> must also be continuous in space and time. Therefore, we linearly interpolated the coefficients <inline-formula><mml:math id="M187" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M188" display="inline"><mml:mi>b</mml:mi></mml:math></inline-formula> across the NAACOM. The interpolated coefficients were subsequently used to adjust the RFR-derived <inline-formula><mml:math id="M189" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2est</sub>.</p>

      <fig id="Ch1.F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e1882">A flowchart of the two-step machine-learning regression model for generating the reconstructed <inline-formula><mml:math id="M191" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product. The grey boxes represent the input and output datasets. The blue boxes illustrate the model training, validation testing, and independent test processes. The orange boxes represent the final trained model for predicting the reconstructed product. The two models in the orange boxes are identical. The training data, consisting of paired input variables (longitude, latitude, month, sea surface temperature (SST), sea surface salinity (SSS), sea surface height (SSH), atmospheric <inline-formula><mml:math id="M193" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M195" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub>), and the corresponding sea surface <inline-formula><mml:math id="M197" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M199" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2sea</sub>) labels), are divided into two sets: X1 (1993–2003 and 2006–2021) and X2 (2004–2005). X1 is randomly divided further into subsets for the model training set (80 %) and the validation set (20 %). The predictive model combines a random forest regression (RFR) algorithm and a linear regression (LR) algorithm. The trained and validated regression model is then applied to all satellite and reanalysis data (without gaps) to generate the 3D reconstructed <inline-formula><mml:math id="M201" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2sea</sub> product, which is then converted into <inline-formula><mml:math id="M203" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2sea</sub> with satellite SST data.</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f03.png"/>

        </fig>

      <p id="d2e2017">The validation set, comprising 20 % of X1 randomly sampled from 1993–2003 and 2006–2021, serves as a critical monitoring step for model evaluation. This subset plays two key roles: first, it tests hyperparameter tuning by providing independent performance metrics on unseen data, and second, it helps detect potential overfitting by monitoring the divergence between training and validation performance. While the validation set itself cannot prevent overfitting, it enables the detection of overfitting patterns when the performance of the model improves on training data but deteriorates on validation data. Through this continuous evaluation process, the validation set ensures more robust model development and helps achieve better generalization capabilities.</p>
      <p id="d2e2021">The independent test set (X2), covering the years 2004–2005, serves as a critical evaluation period specifically designed to assess the reliability of the model in predicting values for years that were completely excluded from both the training and validation phases. Because we intentionally withhold these 2 years from model development, this approach directly tests the capability of the model to generate reliable predictions and fill temporal data gaps for periods without observational data.</p>
      <p id="d2e2024">Finally, the trained model is applied to all the satellite and reanalysis data to generate the final gap-free reconstructed <inline-formula><mml:math id="M205" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data. As most products reported seawater CO<sub>2</sub> concentrations as <inline-formula><mml:math id="M208" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, we subsequently converted the reconstructed <inline-formula><mml:math id="M210" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values into <inline-formula><mml:math id="M212" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> using the following equation (Takahashi et al., 2020), and our final product reports both <inline-formula><mml:math id="M214" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and <inline-formula><mml:math id="M216" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>:
            <disp-formula id="Ch1.E2" content-type="numbered"><label>2</label><mml:math id="M218" display="block"><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>=</mml:mo><mml:mi>f</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>×</mml:mo><mml:mo>(</mml:mo><mml:mn mathvariant="normal">1.00436</mml:mn><mml:mo>-</mml:mo><mml:mn mathvariant="normal">4.669</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:msup><mml:mo>×</mml:mo><mml:mi mathvariant="normal">SST</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
</sec>
<sec id="Ch1.S2.SS3">
  <label>2.3</label><title>Regression model input variables from satellite and reanalysis</title>
      <p id="d2e2194">The input variables for training the regression model are longitude (long), latitude (lat), month, sea surface temperature (SST), sea surface salinity (SSS), sea surface height (SSH), and atmospheric <inline-formula><mml:math id="M219" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M221" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub>). Longitude, latitude, and month serve as spatiotemporal predictors, enabling the algorithm to identify and capture regional and seasonal variability in <inline-formula><mml:math id="M223" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> within the study area (Su et al., 2020; Yang et al., 2024). SST, SSS, and SSH are critical variables that characterize the physical and biogeochemical ocean settings, which play a crucial role in determining the spatial and temporal variability of <inline-formula><mml:math id="M225" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. <inline-formula><mml:math id="M227" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub> represents the atmospheric forcing in the air–sea CO<sub>2</sub> exchange. Including <inline-formula><mml:math id="M230" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub> is essential for accurately assessing the decadal <inline-formula><mml:math id="M232" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> trend.</p>
      <p id="d2e2329">SST data were obtained from the National Oceanic and Atmospheric Administration (NOAA) Optimum Interpolation Sea Surface Temperature (OISST) v2.1 product (Huang et al., 2021). The OISST dataset is a global gridded SST analysis that blends observations from various sources, including satellites, ships, and buoys. The dataset employs an optimum interpolation technique to combine these observations and generate a daily SST field at a spatial resolution of 0.25° <inline-formula><mml:math id="M234" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.25°. For this study, the daily SST data were averaged to create a monthly product.</p>
      <p id="d2e2339">SSS data were obtained from the Simple Ocean Data Assimilation (SODA) v3.15.2 product (Carton et al., 2018). SODA is a comprehensive reanalysis dataset that integrates a global ocean model with observational data to estimate ocean state variables consistently. The SODA system assimilates observations from multiple sources, including floats, moorings, and ship-based measurements, thereby constraining the model output and enhancing the accuracy of the represented ocean physical properties, including SSS. The SODA v3.15.2 product offers monthly SSS data with a temporal resolution of 1 month and a spatial resolution of 0.5° <inline-formula><mml:math id="M235" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.5°, which were linearly interpolated to a 0.25° <inline-formula><mml:math id="M236" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.25° grid resolution to maintain consistency with other input variables and the gridded SOCAT <inline-formula><mml:math id="M237" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data. Note that such interpolation could potentially introduce additional errors. We doubled the SSS uncertainty in the region, assuming that this would encompass its true uncertainty (see Appendix B).</p>
      <p id="d2e2372">SSH data were extracted from the Global Ocean Gridded L4 Sea Surface Heights (CMEMS, 2021) created by the Copernicus Marine Environment Monitoring Service (CMEMS). Since 1993 (ongoing) this product has provided daily SSH data derived from altimeters with a spatial resolution of 0.25° <inline-formula><mml:math id="M239" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.25°. Daily SSH data were averaged to monthly means.</p>
      <p id="d2e2383"><inline-formula><mml:math id="M240" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub> data converted from the mole fraction of CO<sub>2</sub> in dry air (xCO<sub>2air</sub>) were downloaded from the NOAA Marine Boundary Layer (MBL) reference product (Lan et al., 2023). The MBL reference product provides weekly zonal average xCO<sub>2air</sub> measurements from a global observation network. The xCO<sub>2air</sub> data were linearly interpolated to the same spatial and temporal resolution as the other input variables (0.25° <inline-formula><mml:math id="M246" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.25°, monthly). xCO<sub>2air</sub> was converted into <inline-formula><mml:math id="M248" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub> with the equation
            <disp-formula id="Ch1.E3" content-type="numbered"><label>3</label><mml:math id="M250" display="block"><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi mathvariant="normal">air</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">xCO</mml:mi></mml:mrow><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi mathvariant="normal">air</mml:mi></mml:mrow></mml:msub><mml:mo>×</mml:mo><mml:mo>(</mml:mo><mml:mi>P</mml:mi><mml:mo>-</mml:mo><mml:msub><mml:mi>p</mml:mi><mml:mi mathvariant="normal">w</mml:mi></mml:msub><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M251" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> is the total atmospheric pressure on the sea surface, which was downloaded from the fifth-generation reanalysis (ERA5) of the European Centre for Medium-Range Weather Forecasts (ECMWF) (Hersbach et al., 2019), and <inline-formula><mml:math id="M252" display="inline"><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mi mathvariant="normal">w</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the water vapor pressure, which was calculated using the formula of Weiss and Price (1980), SST from OISST, and SSS from SODA.</p>
</sec>
<sec id="Ch1.S2.SS4">
  <label>2.4</label><title>Evaluation of the models</title>
      <p id="d2e2561">The accuracy of the model outputs was assessed using several statistical metrics, including the coefficient of determination (<inline-formula><mml:math id="M253" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>), root-mean-square error (RMSE), mean absolute error (MAE), and mean bias error (MBE). These metrics were calculated for the training and validation set phases as well as for the independent validation set:

                <disp-formula specific-use="gather" content-type="numbered"><mml:math id="M254" display="block"><mml:mtable displaystyle="true"><mml:mlabeledtr id="Ch1.E4"><mml:mtd><mml:mtext>4</mml:mtext></mml:mtd><mml:mtd><mml:mrow><mml:mstyle displaystyle="true" class="stylechange"/><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mo>=</mml:mo><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mi>i</mml:mi><mml:mi>N</mml:mi></mml:msubsup><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">obs</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">est</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>/</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mi>i</mml:mi><mml:mi>N</mml:mi></mml:msubsup><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">obs</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr><mml:mlabeledtr id="Ch1.E5"><mml:mtd><mml:mtext>5</mml:mtext></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:mi mathvariant="normal">RMSE</mml:mi><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>N</mml:mi></mml:mfrac></mml:mstyle><mml:msubsup><mml:mo>∑</mml:mo><mml:mi>i</mml:mi><mml:mi>N</mml:mi></mml:msubsup><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">obs</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">est</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:msqrt><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr><mml:mlabeledtr id="Ch1.E6"><mml:mtd><mml:mtext>6</mml:mtext></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:mi mathvariant="normal">MAE</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>N</mml:mi></mml:mfrac></mml:mstyle><mml:msubsup><mml:mo>∑</mml:mo><mml:mi>i</mml:mi><mml:mi>N</mml:mi></mml:msubsup><mml:mfenced open="|" close="|"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">obs</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">est</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr><mml:mlabeledtr id="Ch1.E7"><mml:mtd><mml:mtext>7</mml:mtext></mml:mtd><mml:mtd><mml:mrow><mml:mstyle displaystyle="true" class="stylechange"/><mml:mi mathvariant="normal">MBE</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>N</mml:mi></mml:mfrac></mml:mstyle><mml:msubsup><mml:mo>∑</mml:mo><mml:mi>i</mml:mi><mml:mi>N</mml:mi></mml:msubsup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">obs</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi mathvariant="normal">est</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr></mml:mtable></mml:math></disp-formula>

            where <inline-formula><mml:math id="M255" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula> denotes the <inline-formula><mml:math id="M256" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>th sample, <inline-formula><mml:math id="M257" display="inline"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M258" display="inline"><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:math></inline-formula> are the observed <inline-formula><mml:math id="M259" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values from SOCAT and their average, <inline-formula><mml:math id="M261" display="inline"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi mathvariant="normal">est</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> represents the predicted <inline-formula><mml:math id="M262" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values from the final model, and <inline-formula><mml:math id="M264" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula> is the total number of matched samples.</p>
</sec>
<sec id="Ch1.S2.SS5">
  <label>2.5</label><title>Uncertainty of the reconstructed <inline-formula><mml:math id="M265" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub></title>
      <p id="d2e2944">The uncertainty of the estimated <inline-formula><mml:math id="M267" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in our product for each grid cell was accumulated from four sources of uncertainties: the direct <inline-formula><mml:math id="M269" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> measurement uncertainty from SOCAT (<inline-formula><mml:math id="M271" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), gridding uncertainty (<inline-formula><mml:math id="M272" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), mapping uncertainty (<inline-formula><mml:math id="M273" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), and the uncertainty accumulated from the input variables (<inline-formula><mml:math id="M274" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>). The first three sources of uncertainty were calculated according to the approach used by earlier reconstructed <inline-formula><mml:math id="M275" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products (Landschützer et al., 2014; Roobaert et al., 2024a; Sharp et al., 2022). <inline-formula><mml:math id="M277" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is inherited from the SOCAT observations. The SOCAT database uses discrete samples with quality flags A and B (accuracy <inline-formula><mml:math id="M278" display="inline"><mml:mrow><mml:mi mathvariant="italic">&lt;</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M279" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) and C and D (accuracy <inline-formula><mml:math id="M280" display="inline"><mml:mrow><mml:mi mathvariant="italic">&lt;</mml:mi><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M281" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) to create the gridded file. Adopting a conservative approach, we used the maximum <inline-formula><mml:math id="M282" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> of 5 <inline-formula><mml:math id="M283" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm. <inline-formula><mml:math id="M284" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was calculated as the standard deviation of the samples used to calculate the gridded <inline-formula><mml:math id="M285" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in each grid cell. <inline-formula><mml:math id="M287" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is introduced by reconstructing the <inline-formula><mml:math id="M288" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> using the RFR–LR model. It was evaluated as the RMSE between the reconstructed <inline-formula><mml:math id="M290" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and the observed <inline-formula><mml:math id="M292" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values following Roobaert et al. (2024a) and Sharp et al. (2022). Given that the derivation of <inline-formula><mml:math id="M294" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M295" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M296" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is contingent upon SOCAT observations, these three uncertainties and the total uncertainty <inline-formula><mml:math id="M297" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> are reported on a subregional basis.</p>
      <p id="d2e3247">In addition to these three sources of uncertainty, this study incorporated cumulative uncertainties from input variables (<inline-formula><mml:math id="M298" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), including SST, SSS, SSH, and <inline-formula><mml:math id="M299" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub>. These satellite-derived or reanalysis-based variables inherently possess uncertainties that propagate nonlinearly through the regression model, ultimately affecting the estimated <inline-formula><mml:math id="M301" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values (Wang et al., 2021, 2023). We employed a Monte Carlo simulation to calculate <inline-formula><mml:math id="M303" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. For each input variable (SST, SSS, SSH, and <inline-formula><mml:math id="M304" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub>), we added white noise following a normal distribution <inline-formula><mml:math id="M306" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>(</mml:mo><mml:mn mathvariant="normal">0</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M307" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the uncertainty of the respective input variable <inline-formula><mml:math id="M308" display="inline"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. We then recalculated <inline-formula><mml:math id="M309" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> using these noise-added inputs and determined the resulting changes in <inline-formula><mml:math id="M311" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. This process was repeated 100 times for each input variable, and the resulting uncertainty in <inline-formula><mml:math id="M313" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> from each variable was calculated as the standard deviation of the differences between the original reconstructed <inline-formula><mml:math id="M315" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and the <inline-formula><mml:math id="M317" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values after adding noise to each grid cell. The final <inline-formula><mml:math id="M319" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was computed as the square root of the quadratic sum of these individual uncertainties from the four input variables. Detailed procedures for determining <inline-formula><mml:math id="M320" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are described in Appendix B.</p>
      <p id="d2e3482">Assuming that these sources are independent, the uncertainty of the estimated gridded <inline-formula><mml:math id="M321" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in our product, <inline-formula><mml:math id="M323" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>, was calculated using the error propagation (Hughes and Hase, 2010; Taylor, 1997):
            <disp-formula id="Ch1.E8" content-type="numbered"><label>8</label><mml:math id="M324" display="block"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:msqrt><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
</sec>
<sec id="Ch1.S2.SS6">
  <label>2.6</label><title>Comparison with the global reconstructed <inline-formula><mml:math id="M325" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product</title>
      <p id="d2e3601">The ReCAD-NAACOM-<inline-formula><mml:math id="M327" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product was evaluated through comparisons with seven reconstructed <inline-formula><mml:math id="M329" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products developed for the global ocean and used in the Global Carbon Budget 2023 edition (Friedlingstein et al., 2023) and one reconstructed <inline-formula><mml:math id="M331" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product specifically developed for the global coastal ocean (ULB_SOMFNN_coastal_v2; Roobaert et al., 2024a). These data products reconstructed <inline-formula><mml:math id="M333" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2sea</sub> data using different machine-learning algorithms. Detailed information on the products is summarized in Table 1.</p>

<table-wrap id="Ch1.T1" specific-use="star"><label>Table 1</label><caption><p id="d2e3675">References for the global <inline-formula><mml:math id="M335" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products used for comparison with ReCAD-NAACOM-<inline-formula><mml:math id="M337" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in this study. The abbreviations in the Methods column are RFRE for random-forest-based regression ensemble, SOM-FFN for self-organizing map–feed-forward network, MLR for multiple linear regression, FFNN for feed-forward neural network, XGB for the eXtreme Gradient Boosting algorithm, and GRaCER for geospatial random-cluster ensemble regression.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="6">
     <oasis:colspec colnum="1" colname="col1" align="justify" colwidth="2cm"/>
     <oasis:colspec colnum="2" colname="col2" align="justify" colwidth="4cm"/>
     <oasis:colspec colnum="3" colname="col3" align="justify" colwidth="3cm"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:colspec colnum="6" colname="col6" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1">Data</oasis:entry>

         <oasis:entry colname="col2">Method</oasis:entry>

         <oasis:entry colname="col3">Type</oasis:entry>

         <oasis:entry colname="col4">Period</oasis:entry>

         <oasis:entry colname="col5">Resolution</oasis:entry>

         <oasis:entry colname="col6">Source</oasis:entry>

       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>

         <oasis:entry rowsep="1" colname="col1" morerows="6">Open-ocean product</oasis:entry>

         <oasis:entry colname="col2">MPI_SOM-FFN_v2022</oasis:entry>

         <oasis:entry colname="col3">SOM-FNN</oasis:entry>

         <oasis:entry colname="col4">1982–2021</oasis:entry>

         <oasis:entry colname="col5">1° <inline-formula><mml:math id="M339" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1°, monthly</oasis:entry>

         <oasis:entry colname="col6">Landschützer et al. (2017)</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Jena-MLS</oasis:entry>

         <oasis:entry colname="col3">MLR</oasis:entry>

         <oasis:entry colname="col4">1951–2021</oasis:entry>

         <oasis:entry colname="col5">2° <inline-formula><mml:math id="M340" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 2°, monthly</oasis:entry>

         <oasis:entry colname="col6">Rödenbeck et al. (2022)</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">CMEMS-LSCE-FFNNv2</oasis:entry>

         <oasis:entry colname="col3">Ensemble of nonlinear models</oasis:entry>

         <oasis:entry colname="col4">1985–2021</oasis:entry>

         <oasis:entry colname="col5">1° <inline-formula><mml:math id="M341" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1°, monthly</oasis:entry>

         <oasis:entry colname="col6">Chau et al. (2022)</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">LDEO-HPD</oasis:entry>

         <oasis:entry colname="col3">XGB</oasis:entry>

         <oasis:entry colname="col4">1985–2018</oasis:entry>

         <oasis:entry colname="col5">1° <inline-formula><mml:math id="M342" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1°, monthly</oasis:entry>

         <oasis:entry colname="col6">Gloege et al. (2022)</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">NIES-NN</oasis:entry>

         <oasis:entry colname="col3">FFNN</oasis:entry>

         <oasis:entry colname="col4">1980–2020</oasis:entry>

         <oasis:entry colname="col5">1° <inline-formula><mml:math id="M343" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1°, monthly</oasis:entry>

         <oasis:entry colname="col6">Zeng et al. (2014)</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">JMA-MLR</oasis:entry>

         <oasis:entry colname="col3">MLR</oasis:entry>

         <oasis:entry colname="col4">1998–2022</oasis:entry>

         <oasis:entry colname="col5">1° <inline-formula><mml:math id="M344" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1°, monthly</oasis:entry>

         <oasis:entry colname="col6">Iida et al. (2021)</oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col2">OS-ETHZ-GRaCER</oasis:entry>

         <oasis:entry colname="col3">GRaCER</oasis:entry>

         <oasis:entry colname="col4">1982–2020</oasis:entry>

         <oasis:entry colname="col5">1° <inline-formula><mml:math id="M345" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 1°, monthly</oasis:entry>

         <oasis:entry colname="col6">Gregor and Gruber (2021)</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col1">Coastal-oceanproduct</oasis:entry>

         <oasis:entry colname="col2">ULB–SOM–FFN–coastalv2</oasis:entry>

         <oasis:entry colname="col3">SOM-FNN</oasis:entry>

         <oasis:entry colname="col4">1982–2020</oasis:entry>

         <oasis:entry colname="col5">0.25° <inline-formula><mml:math id="M346" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.25°, monthly</oasis:entry>

         <oasis:entry colname="col6">Roobaert et al. (2024a)</oasis:entry>

       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Results and discussion</title>
<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Evaluating the regression model performance</title>
      <p id="d2e3985">Our product employs a two-step RFR–LR algorithm to retrieve <inline-formula><mml:math id="M347" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. The initial RFR step accurately captures most seasonal and decadal <inline-formula><mml:math id="M349" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variations across all six subregions (Appendix A). When comparing only at matching grid cells where SOCAT measurements are available, the differences (<inline-formula><mml:math id="M351" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">12</mml:mn></mml:mrow></mml:math></inline-formula>) in the monthly mean climatology between the SOCAT- and RFR-derived <inline-formula><mml:math id="M352" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> are less than 2 <inline-formula><mml:math id="M354" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm on average, with standard deviations below 5 <inline-formula><mml:math id="M355" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm across all the subregions (Fig. A1). However, the RFR-derived <inline-formula><mml:math id="M356" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> shows lower accuracy in capturing long-term <inline-formula><mml:math id="M358" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> changes in the GoMe and SAB. The subsequent LR calibration improves the performance significantly: <inline-formula><mml:math id="M360" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> values increase from 0.69 to 0.81 in the GoMe and from 0.83 to 0.93 in the SAB, while the RMSE decreases from 12.43 to 10.51 <inline-formula><mml:math id="M361" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm in the GoMe and from 10.83 to 8.12 <inline-formula><mml:math id="M362" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm in the SAB (Fig. A2).</p>
      <p id="d2e4125">The ReCAD-NAACOM-<inline-formula><mml:math id="M363" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product demonstrated robust performance and high accuracy in capturing <inline-formula><mml:math id="M365" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variability across the NAACOM (Fig. 4). During the model training phase, the product achieved an <inline-formula><mml:math id="M367" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> of 0.96, an RMSE of 9.1 <inline-formula><mml:math id="M368" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, an MAE of 5.92 <inline-formula><mml:math id="M369" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, and an MBE of 0.05 <inline-formula><mml:math id="M370" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm (Fig. 4a). The model demonstrated comparable performance metrics during the validation phase (Fig. 4b). To further evaluate the generalizability and robustness of the model, we also conducted an independent test using data from 2004 to 2005 in which not all the data samples were included in the model training and validation sets. During this independent test phase, the <inline-formula><mml:math id="M371" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product maintained high accuracy, with <inline-formula><mml:math id="M373" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.64</mml:mn></mml:mrow></mml:math></inline-formula>, RMSE <inline-formula><mml:math id="M374" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 27.2 <inline-formula><mml:math id="M375" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, MAE <inline-formula><mml:math id="M376" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 18.86 <inline-formula><mml:math id="M377" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, and MBE <inline-formula><mml:math id="M378" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.07 <inline-formula><mml:math id="M379" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm (Fig. 4c). Additionally, most independent validation samples were distributed around the <inline-formula><mml:math id="M380" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>:</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> correspondence line, proving the ability of the models to predict <inline-formula><mml:math id="M381" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across unsampled spatial and temporal domains without overfitting. The model consistently demonstrated strong performance during the training, validation, and independent test phases across all the subregions (Table 2). Overall, compared with all the available samples in SOCAT, it achieved an <inline-formula><mml:math id="M383" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> of 0.92, an RMSE of 12.70 <inline-formula><mml:math id="M384" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, an MAE of 7.55 <inline-formula><mml:math id="M385" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, and an MBE of 0.13 <inline-formula><mml:math id="M386" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm for the entire NAACOM (Table 2), highlighting the generalizability of the ReCAD-NAACOM-<inline-formula><mml:math id="M387" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product and robustness in effectively capturing the variability in <inline-formula><mml:math id="M389" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and providing reliable predictions of <inline-formula><mml:math id="M391" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the studied regions.</p>

      <fig id="Ch1.F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e4389">Evaluation of the regression model for reconstructing the ReCAD-NAACOM-<inline-formula><mml:math id="M393" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product. The density scatterplots compare the product-estimated <inline-formula><mml:math id="M395" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M397" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2est</sub>) with the in situ SOCAT observations (<inline-formula><mml:math id="M399" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2obs</sub>) during the <bold>(a)</bold> model training phase (80 % of the samples during the periods 1993–2003 and 2006–2021), <bold>(b)</bold> validation phase (20 % of the samples during the periods 1993–2003 and 2006–2021), and <bold>(c)</bold> independent test phase (samples during the period 2004–2005). The statistical metrics include the coefficient of determination (<inline-formula><mml:math id="M401" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>), root-mean-square error (RMSE), mean absolute error (MAE), mean bias error (MBE), and number of samples (<inline-formula><mml:math id="M402" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>). The color bar represents the number of data points in each bin.</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f04.png"/>

        </fig>

<table-wrap id="Ch1.T2" specific-use="star"><label>Table 2</label><caption><p id="d2e4501">Performance of the regression model during the model training, validation, and independent test phases across the different subregions. The metrics include the coefficient of determination (<inline-formula><mml:math id="M403" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>), root-mean-square error (RMSE), mean absolute error (MAE), and mean bias error (MBE). The subregions are the Gulf of Mexico (GoMx), South Atlantic Bight (SAB), Mid-Atlantic Bight (MAB), Gulf of Maine (GoMe), Scotian Shelf (SS), and Gulf of St. Lawrence and Grand Banks (GStL&amp;GB).</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="6">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Region</oasis:entry>
         <oasis:entry colname="col2">Type</oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M404" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4">RMSE (<inline-formula><mml:math id="M405" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm)</oasis:entry>
         <oasis:entry colname="col5">MAE (<inline-formula><mml:math id="M406" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm)</oasis:entry>
         <oasis:entry colname="col6">MBE (<inline-formula><mml:math id="M407" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">GStL&amp;GB</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.97</oasis:entry>
         <oasis:entry colname="col4">7.81</oasis:entry>
         <oasis:entry colname="col5">5.31</oasis:entry>
         <oasis:entry colname="col6">0.33</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.91</oasis:entry>
         <oasis:entry colname="col4">13.57</oasis:entry>
         <oasis:entry colname="col5">8.83</oasis:entry>
         <oasis:entry colname="col6">0.44</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.76</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">25.23</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">16.82</oasis:entry>
         <oasis:entry rowsep="1" colname="col6"><inline-formula><mml:math id="M408" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">5.64</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.94</oasis:entry>
         <oasis:entry colname="col4">11.48</oasis:entry>
         <oasis:entry colname="col5">6.92</oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M409" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.15</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SS</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.96</oasis:entry>
         <oasis:entry colname="col4">9.35</oasis:entry>
         <oasis:entry colname="col5">6.61</oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M410" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1.13</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.90</oasis:entry>
         <oasis:entry colname="col4">13.27</oasis:entry>
         <oasis:entry colname="col5">9.41</oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M411" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.90</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.50</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">30.92</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">24.12</oasis:entry>
         <oasis:entry rowsep="1" colname="col6"><inline-formula><mml:math id="M412" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3.50</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.90</oasis:entry>
         <oasis:entry colname="col4">13.82</oasis:entry>
         <oasis:entry colname="col5">8.89</oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M413" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1.32</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">GoMe</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.95</oasis:entry>
         <oasis:entry colname="col4">10.62</oasis:entry>
         <oasis:entry colname="col5">7.72</oasis:entry>
         <oasis:entry colname="col6">0.14</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.81</oasis:entry>
         <oasis:entry colname="col4">20.12</oasis:entry>
         <oasis:entry colname="col5">14.35</oasis:entry>
         <oasis:entry colname="col6">0.83</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.49</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">31.66</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">23.95</oasis:entry>
         <oasis:entry rowsep="1" colname="col6">3.72</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.90</oasis:entry>
         <oasis:entry colname="col4">14.91</oasis:entry>
         <oasis:entry colname="col5">9.97</oasis:entry>
         <oasis:entry colname="col6">0.49</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">MAB</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.97</oasis:entry>
         <oasis:entry colname="col4">9.39</oasis:entry>
         <oasis:entry colname="col5">6.60</oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M414" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.06</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.84</oasis:entry>
         <oasis:entry colname="col4">19.49</oasis:entry>
         <oasis:entry colname="col5">13.47</oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M415" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.19</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.56</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">37.93</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">28.53</oasis:entry>
         <oasis:entry rowsep="1" colname="col6">7.13</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.93</oasis:entry>
         <oasis:entry colname="col4">13.26</oasis:entry>
         <oasis:entry colname="col5">8.44</oasis:entry>
         <oasis:entry colname="col6">0.08</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SAB</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.96</oasis:entry>
         <oasis:entry colname="col4">6.76</oasis:entry>
         <oasis:entry colname="col5">4.24</oasis:entry>
         <oasis:entry colname="col6">0.30</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.87</oasis:entry>
         <oasis:entry colname="col4">12.03</oasis:entry>
         <oasis:entry colname="col5">6.98</oasis:entry>
         <oasis:entry colname="col6">0.98</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.73</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">23.60</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">16.75</oasis:entry>
         <oasis:entry rowsep="1" colname="col6">1.33</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.91</oasis:entry>
         <oasis:entry colname="col4">10.63</oasis:entry>
         <oasis:entry colname="col5">5.95</oasis:entry>
         <oasis:entry colname="col6">0.52</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">GoMx</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.94</oasis:entry>
         <oasis:entry colname="col4">9.13</oasis:entry>
         <oasis:entry colname="col5">5.14</oasis:entry>
         <oasis:entry colname="col6">0.08</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.76</oasis:entry>
         <oasis:entry colname="col4">19.08</oasis:entry>
         <oasis:entry colname="col5">9.82</oasis:entry>
         <oasis:entry colname="col6">0.74</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.46</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">14.70</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">7.64</oasis:entry>
         <oasis:entry rowsep="1" colname="col6"><inline-formula><mml:math id="M416" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">4.49</mml:mn></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.90</oasis:entry>
         <oasis:entry colname="col4">11.86</oasis:entry>
         <oasis:entry colname="col5">6.10</oasis:entry>
         <oasis:entry colname="col6">0.09</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">NAACOM</oasis:entry>
         <oasis:entry colname="col2">Training set</oasis:entry>
         <oasis:entry colname="col3">0.96</oasis:entry>
         <oasis:entry colname="col4">9.11</oasis:entry>
         <oasis:entry colname="col5">5.92</oasis:entry>
         <oasis:entry colname="col6">0.05</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Validation set</oasis:entry>
         <oasis:entry colname="col3">0.84</oasis:entry>
         <oasis:entry colname="col4">17.89</oasis:entry>
         <oasis:entry colname="col5">11.04</oasis:entry>
         <oasis:entry colname="col6">0.50</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" colname="col2">Independent test set</oasis:entry>
         <oasis:entry rowsep="1" colname="col3">0.64</oasis:entry>
         <oasis:entry rowsep="1" colname="col4">27.17</oasis:entry>
         <oasis:entry rowsep="1" colname="col5">18.86</oasis:entry>
         <oasis:entry rowsep="1" colname="col6">0.07</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">All</oasis:entry>
         <oasis:entry colname="col3">0.92</oasis:entry>
         <oasis:entry colname="col4">12.70</oasis:entry>
         <oasis:entry colname="col5">7.55</oasis:entry>
         <oasis:entry colname="col6">0.13</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>


</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Spatial distribution of the product bias</title>
      <p id="d2e5275">The ReCAD-NAACOM-<inline-formula><mml:math id="M417" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product exhibited a negligible area-mean bias of <inline-formula><mml:math id="M419" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">0.13</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M420" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm with a standard deviation of 12.70 <inline-formula><mml:math id="M421" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm when compared to all SOCAT observation grid cells across the entire NAACOM (Fig. 5 and Table 2). This small average difference suggests no consistent overestimation or underestimation by the regression model, indicating the reliability of the product in estimating the monthly and annual mean climatology of <inline-formula><mml:math id="M422" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the entire NAACOM region.</p>

      <fig id="Ch1.F5" specific-use="star"><label>Figure 5</label><caption><p id="d2e5339">Spatial distribution of the MBE between the ReCAD-NAACOM-<inline-formula><mml:math id="M424" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product and SOCAT observations across the NAACOM. The MBE is calculated for each grid cell as the average difference between product estimates and SOCAT observations. Positive values (red) indicate product overestimation, while negative values (blue) indicate underestimation relative to SOCAT. Regional MBE values with 1 standard deviation are shown for each subregion, corresponding to the values in the last column of Table 2. The overall bias error for the NAACOM is <inline-formula><mml:math id="M426" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">0.13</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M427" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 12.97 <inline-formula><mml:math id="M428" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm. Following Fennel et al. (2019), the study region is divided into six subregions using straight orange lines: the GoMx, SAB, MAB, GoMe, SS, and GStL&amp;GB. The thick black line is the 200 m isobath, which roughly marks the shelf break and typically defines the continental shelf boundary.</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f05.png"/>

        </fig>

      <p id="d2e5389">While the area-averaged difference is small, the differences are distributed heterogeneously in space. Larger differences (absolute difference <inline-formula><mml:math id="M429" display="inline"><mml:mrow><mml:mi mathvariant="italic">&gt;</mml:mi><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M430" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) tend to occur in nearshore regions, particularly along the coastlines of the GoMx and SAB, as well as in northern areas such as the GoMe, SS, and GStL&amp;GB (Fig. 5). These regional variations can be attributed to complex coastal processes such as terrestrial inputs, sparse observations in the northern areas (Lavoie et al., 2021; Rutherford et al., 2021; Salisbury and Jönsson, 2018), and less accurate satellite observations in the nearshore regions (Song et al., 2023). Conversely, smaller differences (absolute difference <inline-formula><mml:math id="M431" display="inline"><mml:mrow><mml:mi mathvariant="italic">&lt;</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M432" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) are observed in the central parts of the GoMx, offshore regions of the SAB and MAB, and some nearshore regions of the SS and GB, which is likely due to more stable oceanic conditions in those regions. The regional MBEs for different machine-learning development phases (training, validation, and test sets) are detailed in Table 2. Despite these regional differences, the MBEs of both the validation set (<inline-formula><mml:math id="M433" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1.0</mml:mn></mml:mrow></mml:math></inline-formula> to 1.0 <inline-formula><mml:math id="M434" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) and the independent test set (<inline-formula><mml:math id="M435" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">4.5</mml:mn></mml:mrow></mml:math></inline-formula> to 7.5 <inline-formula><mml:math id="M436" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm) demonstrate minimal values across the subregions (Table 2), underscoring the effectiveness of the product in capturing the broader <inline-formula><mml:math id="M437" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> patterns across the NAACOM.</p>
</sec>
<sec id="Ch1.S3.SS3">
  <label>3.3</label><title>Evaluating the capacity of the product to capture <inline-formula><mml:math id="M439" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> seasonality</title>
      <p id="d2e5506">One of the primary objectives of this product is to capture the seasonal cycle of <inline-formula><mml:math id="M441" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the NAACOM region. Figure 6 showcases the applicability of the product in capturing the <inline-formula><mml:math id="M443" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> seasonal cycles across the southern and northern areas of the NAACOM (red and blue boxes in Fig. 2). The comparison of monthly climatologies between the gap-filled product and SOCAT observations reveals strong agreement in the southern region despite the coverage difference, with the product-estimated monthly means being only 3.05 <inline-formula><mml:math id="M445" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 5.60 <inline-formula><mml:math id="M446" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm higher than those of SOCAT (Fig. 6a) and suggesting that our product effectively captures the seasonal cycle where data are abundant.</p>

      <fig id="Ch1.F6" specific-use="star"><label>Figure 6</label><caption><p id="d2e5559">Monthly mean climatology of <inline-formula><mml:math id="M447" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the southern and northern areas of the NAACOM from 1993 to 2021. The subregions are <bold>(a)</bold> the southern areas with the red box in Fig. 2 and <bold>(b)</bold> the northern areas with the blue box in Fig. 2. Two data representations are shown: (1) SOCAT observations (black curves), which may be influenced by missing data, and (2) the complete gap-filled product output (red curves). The error bars denote 1 standard deviation of the monthly mean climatology of <inline-formula><mml:math id="M449" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. The numbers indicate the mean difference (<inline-formula><mml:math id="M451" display="inline"><mml:mo lspace="0mm">±</mml:mo></mml:math></inline-formula> 1 standard deviation) in the monthly climatological <inline-formula><mml:math id="M452" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> calculated from the two sources, with positive values indicating higher product estimates compared to SOCAT observations. The <inline-formula><mml:math id="M454" display="inline"><mml:mi>x</mml:mi></mml:math></inline-formula> axis shows the months (1–12, where 1 represents January), and the <inline-formula><mml:math id="M455" display="inline"><mml:mi>y</mml:mi></mml:math></inline-formula> axis shows <inline-formula><mml:math id="M456" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M458" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm).</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f06.png"/>

        </fig>

      <p id="d2e5669">In the northern region where SOCAT data are sparse, the gap-filling ability of the product is also demonstrated well. In the northern region, the area-averaged monthly <inline-formula><mml:math id="M459" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> climatology calculated from the continuous reconstructed product is 22 <inline-formula><mml:math id="M461" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 11.12 <inline-formula><mml:math id="M462" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm lower than the SOCAT observations, which can be attributed to the limited observational coverage in this area. This area is characterized by sparse sampling, with the observational density approximately 50 % lower than in the southern region (Fig. 2) due to the smaller area and limited cruise coverage. For instance, the GStL region only has one summer cruise in the SOCAT database (Fig. 2b), and the SS and GoMe have particularly sparse winter observations (Fig. 2d). The higher latitudes typically exhibit larger seasonal amplitudes in <inline-formula><mml:math id="M463" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, making the limited sampling from SOCAT particularly problematic for accurate characterization. Our gap-free product provides comprehensive spatial and temporal coverage, enabling more robust analysis of <inline-formula><mml:math id="M465" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> patterns and variability in these historically undersampled regions.</p>
      <p id="d2e5737">Over the 29-year period, the product predicts smaller monthly standard deviations in the southern region (less than 40 <inline-formula><mml:math id="M467" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm; error bars in Fig. 6a), suggesting higher model accuracy and less interannual variability in these areas. Conversely, larger monthly standard deviations are observed in the northern areas, suggesting potentially lower accuracy and remarkable interannual variability. However, the larger interannual variability in these areas may be an artifact of the limited observational data available for regression model training, resulting in greater uncertainty in the predictions. Despite differences in the mean monthly climatology, the similar seasonal <inline-formula><mml:math id="M468" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> cycles calculated from SOCAT and the reconstructed product demonstrate the ability of the ReCAD-NAACOM-<inline-formula><mml:math id="M470" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product to represent seasonal <inline-formula><mml:math id="M472" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variability across diverse coastal environments. Nevertheless, there exist larger differences between the observations and reconstructed <inline-formula><mml:math id="M474" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in some months and regions (Fig. 6b), highlighting the importance of the gap-free product in an unbiased understanding of regional carbon cycles (Ren et al., 2024). Detailed sea surface <inline-formula><mml:math id="M476" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> seasonal cycles and their controlling mechanisms across different subregions of the NAACOM will be presented in our subsequent work.</p>
</sec>
<sec id="Ch1.S3.SS4">
  <label>3.4</label><title>Evaluating the ability of the products to capture regional variation by comparing them to global products</title>
      <p id="d2e5837">The ReCAD-NAACOM-<inline-formula><mml:math id="M478" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product demonstrates the capability to resolve fine-scale regional spatial distributions of <inline-formula><mml:math id="M480" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. Figure 7 illustrates the spatial distribution of the annual mean climatology of <inline-formula><mml:math id="M482" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the NAACOM as observed by SOCAT and predicted by different global open- and coastal-ocean <inline-formula><mml:math id="M484" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products. Despite being affected by missing data, SOCAT observations (Fig. 7a) reveal significant regional variations in <inline-formula><mml:math id="M486" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. In the Louisiana Shelf (LAS) estuary plume region (box 1 in Fig. 7), <inline-formula><mml:math id="M488" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values consistently remain below 340 <inline-formula><mml:math id="M490" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, while the West Florida Shelf (WFS; box 2 in Fig. 7) exhibits elevated values exceeding 400 <inline-formula><mml:math id="M491" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm. These contrasting patterns have been reported in previous regional studies (Kealoha et al., 2020; Robbins et al., 2018; Wu et al., 2024b).</p>

      <fig id="Ch1.F7" specific-use="star"><label>Figure 7</label><caption><p id="d2e5956">Spatial distribution of the annual mean <inline-formula><mml:math id="M492" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> climatology in the NAACOM from different sources. <bold>(a)</bold> SOCAT observations, <bold>(b)</bold> the ReCAD-NAACOM-<inline-formula><mml:math id="M494" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product, <bold>(c)</bold> the ensemble mean of the seven global open-ocean <inline-formula><mml:math id="M496" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products listed in Table 1, and <bold>(d)</bold> the coastal <inline-formula><mml:math id="M498" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product ULB_SOMFFN_coastal_v2 (Roobaert et al., 2024a). The black contour delineates the coastal-ocean margin. The three boxes represent subregions in the NAACOM: box 1 for the Louisiana Shelf (LAS), box 2 for the West Florida Shelf (WFS), box 3 for the entire northern region, and box 4 for the southern GStL (S.GStL). Mean <inline-formula><mml:math id="M500" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> <inline-formula><mml:math id="M502" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> standard deviations of all the grid cells are provided for each dataset. The color scale represents <inline-formula><mml:math id="M503" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> (<inline-formula><mml:math id="M505" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm).</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f07.png"/>

        </fig>

      <p id="d2e6091">The ReCAD-NAACOM-<inline-formula><mml:math id="M506" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product demonstrates superior alignment with SOCAT observations in capturing those regional features that have been reported in previous observation-based studies (Fig. 7b), accurately representing the low <inline-formula><mml:math id="M508" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values in the LAS Mississippi River plume (box 1) and the elevated <inline-formula><mml:math id="M510" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> levels in the WFS (box 2). In contrast, the global reconstructions of <inline-formula><mml:math id="M512" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, represented by the ensemble of seven open-ocean <inline-formula><mml:math id="M514" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products (Fig. 7c), face challenges in resolving these regional <inline-formula><mml:math id="M516" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variations, as previously discussed in Wu et al. (2024b). The coastal <inline-formula><mml:math id="M518" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product from Roobaert et al. (2024a; ULB_SOMFFN_coastal_v2) also captures some small-scale structures like the low <inline-formula><mml:math id="M520" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the LAS (Fig. 7d), but the ReCAD-NAACOM-<inline-formula><mml:math id="M522" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product exhibits values that are closer to the observations. In the northern region (box 3), the ReCAD-NAACOM-<inline-formula><mml:math id="M524" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product predicts higher <inline-formula><mml:math id="M526" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> levels that are closer to observations in the nearshore region (Fig. 7b). This is not surprising, as ULB_SOMFNN_coastal_v2 is a global product known for its high accuracy on the global average.</p>
      <p id="d2e6274">In addition to these previously documented regional variations, our product reveals several notable features not previously captured by observations or other existing products. For instance, the GoMe displays intermediate <inline-formula><mml:math id="M528" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> levels of around 380 <inline-formula><mml:math id="M530" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, which is distinctly higher than surrounding waters at comparable latitudes, a feature previously documented by a <inline-formula><mml:math id="M531" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product reconstructed using multiple linear regression (Signorini et al., 2013) and 5-year (2004–2009) mooring and cruise data (Vandemark et al., 2011). However, this contradicts two other studies based on numerical models (Cahill et al., 2016; Rutherford et al., 2021). In the southern GStL (S.GStL; box 4 in Fig. 7), <inline-formula><mml:math id="M533" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values are slightly higher compared to adjacent waters at similar latitudes, aligning with high nutrient concentrations typically observed in these river-influenced waters (Lavoie et al., 2021). These regional patterns could not be captured completely by the global products (Fig. 7c and d). The ability of the ReCAD-NAACOM-<inline-formula><mml:math id="M535" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product to resolve such regional features demonstrates its potential value for investigating coastal carbon dynamics and their responses to local and regional forcing factors in the NAACOM.</p>
</sec>
<sec id="Ch1.S3.SS5">
  <label>3.5</label><title>Evaluating the capacity of the product to detect decadal linear trends of <inline-formula><mml:math id="M537" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub></title>
      <p id="d2e6375">Using <inline-formula><mml:math id="M539" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> products to accurately reconstruct <inline-formula><mml:math id="M541" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> linear trends in coastal regions presents significant challenges due to the high spatial heterogeneity of coastal <inline-formula><mml:math id="M543" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> dynamics. This heterogeneity often leads to sea surface <inline-formula><mml:math id="M545" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> changes that deviate from atmospheric trends (Laruelle et al., 2018). Even when utilizing similar observational datasets, derived products may not consistently reflect the underlying trends. For instance, Wu et al. (2024b) examined the ability of various products to reflect <inline-formula><mml:math id="M547" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> changes in the GoMx, a region where <inline-formula><mml:math id="M549" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> trends exhibit significant spatial variability. Despite this heterogeneity, seven global open-ocean products (listed in Table 1) indicate trends similar to atmospheric <inline-formula><mml:math id="M551" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the entire GoMx without regional differences. In contrast, the GoMx-specific regional product developed by Chen and Hu (2019) demonstrates no significant overall trend. The discrepancy in trend detection stems primarily from the design of the regression model and the selection of the input variables. These factors are critical in capturing the complex spatiotemporal variability of coastal <inline-formula><mml:math id="M553" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and its long-term evolution.</p>
      <p id="d2e6508">To assess the capability of the product in resolving decadal <inline-formula><mml:math id="M555" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> trends, we conducted an analysis of the <inline-formula><mml:math id="M557" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> evolution using three distinct regions within the NAACOM (three boxes in Fig. 7) as representative examples (Fig. 8). Decadal trends of deseasonalized time series were calculated following the protocol established by Sutton et al. (2022). The LAS (box 1 in Fig. 7) has been identified as an increasing CO<sub>2</sub> sink characterized by a negative <inline-formula><mml:math id="M560" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> rate increase from 2002 to 2021 (Wu et al., 2024b). Our product results for the extended period of 1993–2021 indicate that <inline-formula><mml:math id="M562" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> increased at a rate of <inline-formula><mml:math id="M564" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">0.44</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M565" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.11 <inline-formula><mml:math id="M566" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm yr<sup>−1</sup> (Fig. 8a). This rate is significantly lower than the observed atmospheric <inline-formula><mml:math id="M568" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> increase in this region during 2002–2021, which is approximately <inline-formula><mml:math id="M570" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1.8</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M571" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm yr<sup>−1</sup>. These findings corroborate our previous conclusion that the LAS is an increasing CO<sub>2</sub> sink, demonstrating the capability of our product in revealing long-term <inline-formula><mml:math id="M574" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> trends in this dynamic river plume region, extending the analysis period by nearly a decade compared to previous studies. In contrast, the WFS (box 2 in Fig. 7) exhibits an accelerated <inline-formula><mml:math id="M576" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> increase that is faster than the atmospheric <inline-formula><mml:math id="M578" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> of around <inline-formula><mml:math id="M580" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.0</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M581" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm yr<sup>−1</sup> (Fig. 8b), aligning with observations reported by Robbins et al. (2018), who found a transition from a CO<sub>2</sub> sink to a source in this region during the 1990s.</p>
      <p id="d2e6767">Both ReCAD-NAACOM-<inline-formula><mml:math id="M584" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and SOCAT consistently report a <inline-formula><mml:math id="M586" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> trend of around <inline-formula><mml:math id="M588" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.3</mml:mn></mml:mrow></mml:math></inline-formula> to <inline-formula><mml:math id="M589" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.5</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M590" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm yr<sup>−1</sup> in the northern region (box 3 in Fig. 7) over 1993–2021 (Fig. 8c), which is faster than the atmospheric <inline-formula><mml:math id="M592" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> increase (around <inline-formula><mml:math id="M594" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">2.0</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M595" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm yr<sup>−1</sup>), suggesting that these areas are becoming a decreasing CO<sub>2</sub> sink. However, limited observational data in this area necessitate cautious interpretation and warrant further validation in future research. Overall, the spatiotemporal heterogeneity in surface-ocean <inline-formula><mml:math id="M598" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> trends across the NAACOM underscores the importance of long-term monitoring to elucidate the drivers of these trends, particularly in regions influenced by major current systems and in areas with limited observational data.</p>

      <fig id="Ch1.F8" specific-use="star"><label>Figure 8</label><caption><p id="d2e6918">Decadal linear trends of sea surface <inline-formula><mml:math id="M600" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in three regions of the NAACOM from 1993 to 2021. The blue and red dots are monthly average <inline-formula><mml:math id="M602" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values (deseasonalized) calculated from SOCAT observations and the reconstructed ReCAD-NAACOM-<inline-formula><mml:math id="M604" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, respectively. The thick lines are linear fitted regression lines. The three regions are the boxes in Fig. 7: the <bold>(a)</bold> LAS (northern Gulf of Mexico shelf river plume region), <bold>(b)</bold> WFS, and <bold>(c)</bold> northern areas. Linear trends are calculated following the protocol established by Sutton et al. (2022). The numbers in parentheses are the number of months with data and <inline-formula><mml:math id="M606" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula> values.</p></caption>
          <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f08.png"/>

        </fig>

</sec>
<sec id="Ch1.S3.SS6">
  <label>3.6</label><title>Evaluating the uncertainty of the product</title>
      <p id="d2e7000">The uncertainty of the reconstructed <inline-formula><mml:math id="M607" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values in each grid cell was estimated by accumulating uncertainties from mapping (<inline-formula><mml:math id="M609" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), gridding (<inline-formula><mml:math id="M610" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), measurement (<inline-formula><mml:math id="M611" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), and input variables (<inline-formula><mml:math id="M612" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>; see Sect. 2.5 for further details on the calculation). To maintain a conservative estimate, we adopted the larger value of 5 <inline-formula><mml:math id="M613" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm as <inline-formula><mml:math id="M614" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> for all the data points. The gridded <inline-formula><mml:math id="M615" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values from SOCAT are reported as the averages of all samples collected within each grid cell. Accordingly, <inline-formula><mml:math id="M617" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was quantified as the standard deviation of samples within each grid cell, calculated across six subregions. Following the previous literature (Roobaert et al., 2024a; Sharp et al., 2022), <inline-formula><mml:math id="M618" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was calculated using the RMSE values of the model validation phase reported in Table 2. The uncertainty from the validation set (20 % of X1) was chosen for its sample size that was larger than the independent test set (X2) and for consistency with the 10-fold cross-validation results while avoiding potential underestimation from the training set. <inline-formula><mml:math id="M619" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was calculated using a Monte Carlo simulation (Appendix B). These four sources of uncertainty were evaluated across different subregions of the NAACOM, as shown in Table 3. <inline-formula><mml:math id="M620" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> contributes the largest portion to the total number of uncertainties across all the sub-subregions, with a maximum value of up to 20.12 <inline-formula><mml:math id="M621" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm in the GoMe. Overall, the ReCAD-NAACOM-<inline-formula><mml:math id="M622" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product demonstrates uncertainties ranging from 16 to 28 <inline-formula><mml:math id="M624" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm across the six subregions and an average uncertainty of 23.25 <inline-formula><mml:math id="M625" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm for the entire NAACOM.</p>

<table-wrap id="Ch1.T3"><label>Table 3</label><caption><p id="d2e7188">Uncertainty estimates for the ReCAD-NAACOM-<inline-formula><mml:math id="M626" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product across the different subregions of the NAACOM. <inline-formula><mml:math id="M628" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M629" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M630" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula><mml:math id="M631" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> represent the measurement uncertainty, gridding uncertainty, mapping uncertainty, and uncertainty accumulated from input variables, respectively (see Sect. 2.5 for further details). <inline-formula><mml:math id="M632" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the total combined uncertainty (<inline-formula><mml:math id="M633" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm). The subregions are the GoMx, SAB, MAB, GoMe, SS, and GStL&amp;GB.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="6">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Region</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M634" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M635" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">grid</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M636" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">map</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M637" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col6"><inline-formula><mml:math id="M638" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">GStL&amp;GB</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">15.44</oasis:entry>
         <oasis:entry colname="col4">13.57</oasis:entry>
         <oasis:entry colname="col5">5.57</oasis:entry>
         <oasis:entry colname="col6">21.88</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SS</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">15.37</oasis:entry>
         <oasis:entry colname="col4">13.27</oasis:entry>
         <oasis:entry colname="col5">6.18</oasis:entry>
         <oasis:entry colname="col6">21.80</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">GoMe</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">16.05</oasis:entry>
         <oasis:entry colname="col4">20.12</oasis:entry>
         <oasis:entry colname="col5">7.51</oasis:entry>
         <oasis:entry colname="col6">27.27</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">MAB</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">16.14</oasis:entry>
         <oasis:entry colname="col4">19.49</oasis:entry>
         <oasis:entry colname="col5">5.97</oasis:entry>
         <oasis:entry colname="col6">26.48</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SAB</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">8.29</oasis:entry>
         <oasis:entry colname="col4">12.03</oasis:entry>
         <oasis:entry colname="col5">5.99</oasis:entry>
         <oasis:entry colname="col6">16.57</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">GoMx</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">10.38</oasis:entry>
         <oasis:entry colname="col4">19.08</oasis:entry>
         <oasis:entry colname="col5">5.55</oasis:entry>
         <oasis:entry colname="col6">22.97</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">NAACOM</oasis:entry>
         <oasis:entry colname="col2">5.00</oasis:entry>
         <oasis:entry colname="col3">12.69</oasis:entry>
         <oasis:entry colname="col4">17.89</oasis:entry>
         <oasis:entry colname="col5">5.86</oasis:entry>
         <oasis:entry colname="col6">23.25</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e7531">Our uncertainty estimation employs a conservative estimation using maximum values at the calculation step. This approach likely overestimates the true uncertainty. Despite this conservative method, our calculated uncertainty for the Atlantic margins is comparable to the 43.4 <inline-formula><mml:math id="M639" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm reported by Sharp et al. (2022) for areas within 100 km of the North American Pacific margins, suggesting good performance of our product. It is important to note that our uncertainty calculation assumed independence among all the sources, which is a simplification. Recent research has highlighted that these uncertainties are often correlated (Ford et al., 2024). Future studies should consider these inter-variable correlations to refine uncertainty estimates. In addition, the uncertainties reported in this section and provided in the NetCDF file represent the propagated errors for individual <inline-formula><mml:math id="M640" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> values in each grid cell. Methods to calculate uncertainties in regional averages of <inline-formula><mml:math id="M642" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> or air–sea CO<sub>2</sub> fluxes over specific spatial and temporal domains are detailed in Roobaert et al. (2024a) and Landschützer et al. (2014).</p>
</sec>
<sec id="Ch1.S3.SS7">
  <label>3.7</label><title>Challenges and limitations</title>
      <p id="d2e7592">Even though ReCAD-NAACOM-<inline-formula><mml:math id="M645" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> resolves regional <inline-formula><mml:math id="M647" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variability with high accuracy in the NAACOM, this product still has room for improvement in the future. Potential areas of improvement include the 0.25° spatial resolution, which is inadequate for resolving submesoscale variability at the scale of 0.1–10 km (McWilliams, 1985). Furthermore, during the independent validation phase, the accuracy of the model-predicted values decreased in the GoMe (<inline-formula><mml:math id="M649" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.49</mml:mn></mml:mrow></mml:math></inline-formula>) and GoMx (<inline-formula><mml:math id="M650" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.46</mml:mn></mml:mrow></mml:math></inline-formula>) (Table 2), which may be due to the complex biological and physical conditions in the estuary plume regions in these two gulfs. In this study, we opted not to include chlorophyll-<inline-formula><mml:math id="M651" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> (Chl-<inline-formula><mml:math id="M652" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula>) concentrations and wind speeds as input variables for model training and prediction. This decision was primarily due to the limited temporal coverage of satellite-derived Chl-<inline-formula><mml:math id="M653" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> data, which only extends back to 1997 with the launch of the Sea-viewing Wide Field-of-view Sensor (SeaWiFS) satellite (O'Reilly et al., 1998). The inclusion of Chl-<inline-formula><mml:math id="M654" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> would have restricted the temporal range of our model, potentially limiting its ability to capture long-term trends and variability in <inline-formula><mml:math id="M655" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>. Future versions of our model will aim to address this limitation. One potential approach is to develop a two-phase model: one phase for the period before 1997 without Chl-<inline-formula><mml:math id="M657" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> data and another for the post-1997 period incorporating Chl-<inline-formula><mml:math id="M658" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> information. Alternatively, we may explore methods to reconstruct historical Chl-<inline-formula><mml:math id="M659" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> data or use proxy variables that correlate with biological productivity and are available for the entire study period.</p>
      <p id="d2e7724">In our previous work, we demonstrated that incorporating wind speeds and sea surface roughness data derived from synthetic aperture radar (SAR) could enhance model performance in predicting <inline-formula><mml:math id="M660" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> at submesoscale resolutions (Wang et al., 2024). In this work, we evaluated the inclusion of wind speed as an input variable in our model. However, at the 0.25° resolution employed here, the addition of wind speed data did not significantly improve the model performance (it only increased the <inline-formula><mml:math id="M662" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> by 0.1). Moreover, when using the same Monte Carlo simulation approach applied to other variables, incorporating wind speeds would introduce an additional 6 <inline-formula><mml:math id="M663" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm uncertainty to <inline-formula><mml:math id="M664" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> estimates, doubling the input-related uncertainties. Consequently, we excluded wind speeds from our regression model to reduce input-related uncertainties. Despite this omission, our product demonstrates robust capability in resolving regional variations, seasonal cycles, and decadal trends in <inline-formula><mml:math id="M666" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, making it valuable for future studies.</p>
</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Data availability</title>
      <p id="d2e7804">The reconstructed <inline-formula><mml:math id="M668" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and <inline-formula><mml:math id="M670" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and the uncertainty in ReCAD (v1.1) are available as a NetCDF file at <uri>https://doi.org/10.5281/zenodo.14038561</uri> (Wu et al., 2024a) and will be updated regularly.</p>
</sec>
<sec id="Ch1.S5">
  <label>5</label><title>Code availability</title>
      <p id="d2e7851">The Python and MATLAB code used to process the data and create the figures included in this paper is provided at <uri>https://github.com/zelunwu/ReCAD</uri> (Wu, 2024).</p>
</sec>
<sec id="Ch1.S6" sec-type="conclusions">
  <label>6</label><title>Conclusions</title>
      <p id="d2e7865">The ReCAD-NAACOM-<inline-formula><mml:math id="M672" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product developed in this study represents a significant advancement in our ability to detect the spatial variations, seasonal cycles, and decadal changes of surface-ocean <inline-formula><mml:math id="M674" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> dynamics in the NAACOM. By leveraging a two-step approach combining random forest and linear regression and a set of environmental predictors, we have created a high-resolution, long-term dataset (1993–2021 period) that captures the complex spatial and temporal variability of <inline-formula><mml:math id="M676" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the region. On average, compared with all available samples from the SOCAT observations in our study region, the product has an <inline-formula><mml:math id="M678" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> of 0.92, an RMSE of 12.70 <inline-formula><mml:math id="M679" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, an MAE of 7.55 <inline-formula><mml:math id="M680" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm, and an MBE of 0.13 <inline-formula><mml:math id="M681" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm for the entire NAACOM, with an average uncertainty of 23.25 <inline-formula><mml:math id="M682" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm. The key findings from this study are the following: <list list-type="order"><list-item>
      <p id="d2e7963">The product demonstrates high accuracy and reliability, as evidenced by strong performance metrics during the training, validation, and independent test phases across the six subregions.</p></list-item><list-item>
      <p id="d2e7967">Distinct seasonal cycles are observed between the southern and northern subregions, with the product capturing nuanced features such as elevated <inline-formula><mml:math id="M683" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> levels during fall and winter in the northern areas.</p></list-item><list-item>
      <p id="d2e7987">Comparison with global products highlights the superior ability of the ReCAD-NAACOM-<inline-formula><mml:math id="M685" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product to resolve small-scale coastal features and variability.</p></list-item><list-item>
      <p id="d2e8007">The <inline-formula><mml:math id="M687" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product successfully reconstructed decadal linear trends that were consistent with previous studies while also revealing a rapid increase in <inline-formula><mml:math id="M689" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the northern region of the NAACOM.</p></list-item></list> While areas of future improvement exist, such as increasing spatial resolution and enhancing accuracy in estuary-plume-influenced regions, the ReCAD-NAACOM-<inline-formula><mml:math id="M691" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product provides a robust foundation for studying coastal carbon dynamics. This dataset will be valuable for investigating air–sea CO<sub>2</sub> fluxes, assessing ocean acidification impacts, and understanding the role of coastal systems in the NAACOM.</p>
      <p id="d2e8068">Future research should validate the reconstructed trends, particularly in areas with limited observational data, and explore the mechanisms driving the spatiotemporal variability in <inline-formula><mml:math id="M694" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> across the NAACOM region. Additionally, the methodologies developed here can contribute to a more comprehensive understanding of coastal-ocean carbon dynamics in the face of climate change and have the potential to be applied globally.</p>
</sec>

      
      </body>
    <back><app-group>

<app id="App1.Ch1.S1">
  <label>Appendix A</label><title>Before and after LR calibration</title>

      <fig id="App1.Ch1.S1.F9"><label>Figure A1</label><caption><p id="d2e8100">Comparisons of the monthly <inline-formula><mml:math id="M696" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> climatology with SOCAT observations across the six subregions: evaluations before and after LR calibration. Values indicate the mean difference (<inline-formula><mml:math id="M698" display="inline"><mml:mo lspace="0mm">±</mml:mo></mml:math></inline-formula> 1 standard deviation; blue: before LR and red: after LR) between model-estimated <inline-formula><mml:math id="M699" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and SOCAT observations over the 12-month period, computed only at grid points and times where SOCAT measurements are available.</p></caption>
        
        <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f09.png"/>

      </fig>

<fig id="App1.Ch1.S1.F10"><label>Figure A2</label><caption><p id="d2e8153">Comparisons of deseasonalized monthly <inline-formula><mml:math id="M701" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> anomalies with SOCAT observations across the six subregions: evaluations before and after LR calibration. Values indicate the <inline-formula><mml:math id="M703" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> and RMSE between model-estimated <inline-formula><mml:math id="M704" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and SOCAT observations (blue: before LR; red: after LR), computed only at grid points and times where SOCAT measurements are available.</p></caption>
        
        <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f10.png"/>

      </fig>

</app>

<app id="App1.Ch1.S2">
  <label>Appendix B</label><title>Monte Carlo simulation in calculating <inline-formula><mml:math id="M706" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula></title>
      <p id="d2e8226">A crucial step in calculating <inline-formula><mml:math id="M707" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is determining the uncertainties of the input variables. In our reconstructed model, there were four variables that needed to be evaluated: SST, SSS, SSH, and <inline-formula><mml:math id="M708" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub>. Our general principle was to adopt conservative estimates, using the largest reported uncertainty for each product when available.</p>
      <p id="d2e8259">SST errors are provided within the OISST product at the grid level. On the global average, OISST reports a mean bias and RMSE of <inline-formula><mml:math id="M710" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.04</mml:mn></mml:mrow></mml:math></inline-formula> and 0.24 °C when compared with the observations on the global average (Huang et al., 2021). For our study region, we calculated the mean SST error across all the grid cells, yielding a value of 0.23 °C.</p>
      <p id="d2e8272">The SODA database assimilates observational data but does not directly provide SSS error estimates. Given this limitation in uncertainty reporting, we derived an estimate based on the RMSE between the model SSS and observations near our study region, as reported by Carton et al. (2018). Their analysis (their Fig. 8) indicates an RMSE exceeding 0.3 psu in the vicinity of our area of interest. In addition, interpolating the 0.5° SSS data to 0.25° resolution could potentially introduce more errors. To maintain a conservative approach in our uncertainty quantification, we doubled the uncertainty and adopted a value of 0.6 psu as the SSS uncertainty for our calculations.</p>
      <p id="d2e8276">SSH errors are directly provided in the dataset, which has a mean uncertainty of 1.8 cm in our study region.</p>
      <p id="d2e8280"><inline-formula><mml:math id="M711" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2air</sub>, calculated from xCO<sub>2air</sub> (MBL references), has a global mean uncertainty of 0.22 ppm.</p>
      <p id="d2e8314">To propagate these input uncertainties to the final <inline-formula><mml:math id="M714" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> estimate, a Monte Carlo simulation approach was implemented: <list list-type="order"><list-item>
      <p id="d2e8335">For each input variable <inline-formula><mml:math id="M716" display="inline"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, random perturbations <inline-formula><mml:math id="M717" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="italic">ε</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> were generated following a normal distribution <inline-formula><mml:math id="M718" display="inline"><mml:mrow><mml:mi>N</mml:mi><mml:mo>(</mml:mo><mml:mn mathvariant="normal">0</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mi>u</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M719" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> represents the uncertainty of the respective variable listed above.</p></list-item><list-item>
      <p id="d2e8393">Perturbed inputs (<inline-formula><mml:math id="M720" display="inline"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi mathvariant="italic">ε</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) were used to calculate <inline-formula><mml:math id="M721" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> with the established model.</p></list-item><list-item>
      <p id="d2e8431">The difference (<inline-formula><mml:math id="M723" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) between the reconstructed <inline-formula><mml:math id="M724" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> before and after adding the perturbation was computed.</p></list-item><list-item>
      <p id="d2e8462">Steps 1, 2, and 3 were iterated 100 times for each input variable.</p></list-item><list-item>
      <p id="d2e8466">The uncertainty contribution from each variable was quantified as the standard deviation of the 100 <inline-formula><mml:math id="M726" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> values in each grid cell.</p></list-item></list> The total uncertainty attributed to the input variables (<inline-formula><mml:math id="M727" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) was then calculated as the square root of the quadratic sum of individual uncertainties: 
          <disp-formula id="App1.Ch1.S2.E9" content-type="numbered"><label>B1</label><mml:math id="M728" display="block"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">SST</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">SSS</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>u</mml:mi><mml:mi mathvariant="normal">SSH</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>u</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow class="chem"><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi mathvariant="normal">air</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:msqrt><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d2e8555">The largest uncertainties propagated from these variables are sourced from SSS and SSH (Fig. B1a and c). Simulating salinity in coastal regions is still challenging due to complex land–ocean interaction. For the SSH, the greatest uncertainties were observed in the GoMe and GStL. Overall, <inline-formula><mml:math id="M729" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is largest in the West Florida Shelf and nearshore waters around the GoMe, with a mean <inline-formula><mml:math id="M730" display="inline"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mi mathvariant="normal">inputs</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> uncertainty of 5.9 <inline-formula><mml:math id="M731" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 4.7 <inline-formula><mml:math id="M732" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>atm for the entire NAACOM.</p>

      <fig id="App1.Ch1.S2.F11"><label>Figure B1</label><caption><p id="d2e8597">Uncertainties of <inline-formula><mml:math id="M733" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> accumulated from the different input variables of the model.</p></caption>
        
        <graphic xlink:href="https://essd.copernicus.org/articles/17/43/2025/essd-17-43-2025-f11.png"/>

      </fig>

</app>
  </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e8628">ZW: conceptualization, data curation, formal analysis, methodology, software, visualization, writing – original draft preparation, writing – review and editing. WL: funding acquisition, methodology, validation, writing – review and editing. AR: validation, writing – review and editing. LS: validation, writing – review and editing. XHY: project administration, supervision. WJC: conceptualization, project administration, supervision, validation, writing – review and editing.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e8634">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e8640">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. While Copernicus Publications makes every effort to include appropriate place names, the final responsibility lies with the authors.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e8648">The authors acknowledge the NOAA for providing the OISST data, the University of Maryland Ocean Climate Laboratory for the SODA dataset, and the European Union's CMEMS for the SSH data. We also express our gratitude to the scientific community for sharing their observational carbonate data in the SOCAT effort. SOCAT is an international effort endorsed by the International Ocean Carbon Coordination Project (IOCCP), the Surface Ocean Lower Atmosphere Study (SOLAS), and the Integrated Marine Biosphere Research (IMBeR) program to deliver a uniform quality-controlled surface-ocean CO<sub>2</sub> database. The many researchers and funding agencies responsible for the collection of the data and the quality control are thanked for their contributions to SOCAT. We would also like to thank Fujian Satellite Date Development Company Ltd. and Fujian Hisea Digital Technology Company Ltd. for their cooperation in the <inline-formula><mml:math id="M736" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> application. We would also like to thank the editor and two anonymous reviewers for their efforts in improving this work.</p><p id="d2e8675">This work is part of Zelun Wu's PhD dissertation in the framework of the University of Delaware–Xiamen University Dual Degree Program in Oceanography.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e8681">This research has been supported by the Southern Marine Science and Engineering Guangdong Laboratory (Zhuhai) (grant no. SML2023SP238) for Wenfang Lu, the Industry-University Cooperation and Collaborative Education Projects (grant no. 202102245034), and the PhD fellowship from the State Key Laboratory of Marine Environmental Science at Xiamen University for Zelun Wu.</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e8687">This paper was edited by Sabine Schmidt and reviewed by two anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bib1"><label>1</label><mixed-citation>Bakker, D. C. E., Pfeil, B., Landa, C. S., Metzl, N., O'Brien, K. M., Olsen, A., Smith, K., Cosca, C., Harasawa, S., Jones, S. D., Nakaoka, S., Nojiri, Y., Schuster, U., Steinhoff, T., Sweeney, C., Takahashi, T., Tilbrook, B., Wada, C., Wanninkhof, R., Alin, S. R., Balestrini, C. F., Barbero, L., Bates, N. R., Bianchi, A. A., Bonou, F., Boutin, J., Bozec, Y., Burger, E. F., Cai, W.-J., Castle, R. D., Chen, L., Chierici, M., Currie, K., Evans, W., Featherstone, C., Feely, R. A., Fransson, A., Goyet, C., Greenwood, N., Gregor, L., Hankin, S., Hardman-Mountford, N. J., Harlay, J., Hauck, J., Hoppema, M., Humphreys, M. P., Hunt, C. W., Huss, B., Ibánhez, J. S. P., Johannessen, T., Keeling, R., Kitidis, V., Körtzinger, A., Kozyr, A., Krasakopoulou, E., Kuwata, A., Landschützer, P., Lauvset, S. K., Lefèvre, N., Lo Monaco, C., Manke, A., Mathis, J. T., Merlivat, L., Millero, F. J., Monteiro, P. M. S., Munro, D. R., Murata, A., Newberger, T., Omar, A. M., Ono, T., Paterson, K., Pearce, D., Pierrot, D., Robbins, L. L., Saito, S., Salisbury, J., Schlitzer, R., Schneider, B., Schweitzer, R., Sieger, R., Skjelvan, I., Sullivan, K. F., Sutherland, S. C., Sutton, A. J., Tadokoro, K., Telszewski, M., Tuma, M., van Heuven, S. M. A. C., Vandemark, D., Ward, B., Watson, A. J., and Xu, S.: A multi-decade record of high-quality fCO2 data in version 3 of the Surface Ocean CO2 Atlas (SOCAT), Earth Syst. Sci. Data, 8, 383–413, <ext-link xlink:href="https://doi.org/10.5194/essd-8-383-2016" ext-link-type="DOI">10.5194/essd-8-383-2016</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib2"><label>2</label><mixed-citation>Breiman, L.: Random Forests, Machine Learning, 45, 5–32, <ext-link xlink:href="https://doi.org/10.1023/A:1010933404324" ext-link-type="DOI">10.1023/A:1010933404324</ext-link>, 2001.</mixed-citation></ref>
      <ref id="bib1.bib3"><label>3</label><mixed-citation>Cahill, B., Wilkin, J., Fennel, K., Vandemark, D., and Friedrichs, M. A. M.: Interannual and seasonal variabilities in air-sea CO<sub>2</sub> fluxes along the U.S. eastern continental shelf and their sensitivity to increasing air temperatures and variable winds: U.S. East Coast Shelf Air-Sea CO<sub>2</sub> Fluxes, J. Geophys. Res.-Biogeo., 121, 295–311, <ext-link xlink:href="https://doi.org/10.1002/2015JG002939" ext-link-type="DOI">10.1002/2015JG002939</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib4"><label>4</label><mixed-citation>Cai, W.-J., Xu, Y.-Y., Feely, R. A., Wanninkhof, R., Jönsson, B., Alin, S. R., Barbero, L., Cross, J. N., Azetsu-Scott, K., Fassbender, A. J., Carter, B. R., Jiang, L.-Q., Pepin, P., Chen, B., Hussain, N., Reimer, J. J., Xue, L., Salisbury, J. E., Hernández-Ayón, J. M., Langdon, C., Li, Q., Sutton, A. J., Chen, C.-T. A., and Gledhill, D. K.: Controls on surface water carbonate chemistry along North American ocean margins, Nat. Commun., 11, 2691, <ext-link xlink:href="https://doi.org/10.1038/s41467-020-16530-z" ext-link-type="DOI">10.1038/s41467-020-16530-z</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib5"><label>5</label><mixed-citation>Carter, B. R., Feely, R. A., Williams, N. L., Dickson, A. G., Fong, M. B., and Takeshita, Y.: Updated methods for global locally interpolated estimation of alkalinity, pH, and nitrate: LIR: Global alkalinity, pH, and nitrate estimates, Limnol. Oceanogr. Methods, 16, 119–131, <ext-link xlink:href="https://doi.org/10.1002/lom3.10232" ext-link-type="DOI">10.1002/lom3.10232</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib6"><label>6</label><mixed-citation>Carton, J. A., Chepurin, G. A., and Chen, L.: SODA3: A New Ocean Climate Reanalysis, J. Climate, 31, 6967–6983, <ext-link xlink:href="https://doi.org/10.1175/JCLI-D-18-0149.1" ext-link-type="DOI">10.1175/JCLI-D-18-0149.1</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib7"><label>7</label><mixed-citation>Chau, T. T. T., Gehlen, M., and Chevallier, F.: A seamless ensemble-based reconstruction of surface ocean <inline-formula><mml:math id="M740" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> and air–sea CO<sub>2</sub> fluxes over the global coastal and open oceans, Biogeosciences, 19, 1087–1109, <ext-link xlink:href="https://doi.org/10.5194/bg-19-1087-2022" ext-link-type="DOI">10.5194/bg-19-1087-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib8"><label>8</label><mixed-citation>Chen, C.-T. A., Huang, T.-H., Chen, Y.-C., Bai, Y., He, X., and Kang, Y.: Air–sea exchanges of CO<sub>2</sub> in the world's coastal seas, Biogeosciences, 10, 6509–6544, <ext-link xlink:href="https://doi.org/10.5194/bg-10-6509-2013" ext-link-type="DOI">10.5194/bg-10-6509-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib9"><label>9</label><mixed-citation>Chen, S. and Hu, C.: Environmental controls of surface water <inline-formula><mml:math id="M744" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in different coastal environments: Observations from marine buoys, Cont. Shelf Res., 183, 73–86, <ext-link xlink:href="https://doi.org/10.1016/j.csr.2019.06.007" ext-link-type="DOI">10.1016/j.csr.2019.06.007</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib10"><label>10</label><mixed-citation>E.U. Copernicus Marine Service Information (CMEMS): Global Ocean Gridded L4 Sea Surface Heights and Derived Variables Reprocessed (1993–ongoing), [data set], <ext-link xlink:href="https://doi.org/10.48670/moi-00148" ext-link-type="DOI">10.48670/moi-00148</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib11"><label>11</label><mixed-citation>Dai, M., Su, J., Zhao, Y., Hofmann, E. E., Cao, Z., Cai, W.-J., Gan, J., Lacroix, F., Laruelle, G. G., Meng, F., Müller, J. D., Regnier, P. A. G., Wang, G., and Wang, Z.: Carbon Fluxes in the Coastal Ocean: Synthesis, Boundary Processes and Future Trends, Annu. Rev. Earth Planet. Sci., 50, 593–626, <ext-link xlink:href="https://doi.org/10.1146/annurev-earth-032320-090746" ext-link-type="DOI">10.1146/annurev-earth-032320-090746</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib12"><label>12</label><mixed-citation>Fay, A. R., Gregor, L., Landschützer, P., McKinley, G. A., Gruber, N., Gehlen, M., Iida, Y., Laruelle, G. G., Rödenbeck, C., Roobaert, A., and Zeng, J.: SeaFlux: harmonization of air–sea CO<sub>2</sub> fluxes from surface <inline-formula><mml:math id="M747" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> data products using a standardized approach, Earth Syst. Sci. Data, 13, 4693–4710, <ext-link xlink:href="https://doi.org/10.5194/essd-13-4693-2021" ext-link-type="DOI">10.5194/essd-13-4693-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib13"><label>13</label><mixed-citation>Fennel, K. and Wilkin, J.: Quantifying biological carbon export for the northwest North Atlantic continental shelves, Geophys. Res. Lett., 36, L18605, <ext-link xlink:href="https://doi.org/10.1029/2009GL039818" ext-link-type="DOI">10.1029/2009GL039818</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bib14"><label>14</label><mixed-citation>Fennel, K., Alin, S., Barbero, L., Evans, W., Bourgeois, T., Cooley, S., Dunne, J., Feely, R. A., Hernandez-Ayon, J. M., Hu, X., Lohrenz, S., Muller-Karger, F., Najjar, R., Robbins, L., Shadwick, E., Siedlecki, S., Steiner, N., Sutton, A., Turk, D., Vlahos, P., and Wang, Z. A.: Carbon cycling in the North American coastal ocean: a synthesis, Biogeosciences, 16, 1281–1304, <ext-link xlink:href="https://doi.org/10.5194/bg-16-1281-2019" ext-link-type="DOI">10.5194/bg-16-1281-2019</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib15"><label>15</label><mixed-citation>Ford, D. J., Blannin, J., Watts, J., Watson, A. J., Landschützer, P., Jersild, A., and Shutler, J. D.: A Comprehensive Analysis of Air-Sea CO<sub>2</sub> Flux Uncertainties Constructed From Surface Ocean Data Products, Global Biogeochem. Cy., 38, e2024GB008188, <ext-link xlink:href="https://doi.org/10.1029/2024GB008188" ext-link-type="DOI">10.1029/2024GB008188</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib16"><label>16</label><mixed-citation>Friedlingstein, P., O'Sullivan, M., Jones, M. W., Andrew, R. M., Bakker, D. C. E., Hauck, J., Landschützer, P., Le Quéré, C., Luijkx, I. T., Peters, G. P., Peters, W., Pongratz, J., Schwingshackl, C., Sitch, S., Canadell, J. G., Ciais, P., Jackson, R. B., Alin, S. R., Anthoni, P., Barbero, L., Bates, N. R., Becker, M., Bellouin, N., Decharme, B., Bopp, L., Brasika, I. B. M., Cadule, P., Chamberlain, M. A., Chandra, N., Chau, T.-T.-T., Chevallier, F., Chini, L. P., Cronin, M., Dou, X., Enyo, K., Evans, W., Falk, S., Feely, R. A., Feng, L., Ford, D. J., Gasser, T., Ghattas, J., Gkritzalis, T., Grassi, G., Gregor, L., Gruber, N., Gürses, Ö., Harris, I., Hefner, M., Heinke, J., Houghton, R. A., Hurtt, G. C., Iida, Y., Ilyina, T., Jacobson, A. R., Jain, A., Jarníková, T., Jersild, A., Jiang, F., Jin, Z., Joos, F., Kato, E., Keeling, R. F., Kennedy, D., Klein Goldewijk, K., Knauer, J., Korsbakken, J. I., Körtzinger, A., Lan, X., Lefèvre, N., Li, H., Liu, J., Liu, Z., Ma, L., Marland, G., Mayot, N., McGuire, P. C., McKinley, G. A., Meyer, G., Morgan, E. J., Munro, D. R., Nakaoka, S.-I., Niwa, Y., O'Brien, K. M., Olsen, A., Omar, A. M., Ono, T., Paulsen, M., Pierrot, D., Pocock, K., Poulter, B., Powis, C. M., Rehder, G., Resplandy, L., Robertson, E., Rödenbeck, C., Rosan, T. M., Schwinger, J., Séférian, R., Smallman, T. L., Smith, S. M., Sospedra-Alfonso, R., Sun, Q., Sutton, A. J., Sweeney, C., Takao, S., Tans, P. P., Tian, H., Tilbrook, B., Tsujino, H., Tubiello, F., van der Werf, G. R., van Ooijen, E., Wanninkhof, R., Watanabe, M., Wimart-Rousseau, C., Yang, D., Yang, X., Yuan, W., Yue, X., Zaehle, S., Zeng, J., and Zheng, B.: Global Carbon Budget 2023, Earth Syst. Sci. Data, 15, 5301–5369, <ext-link xlink:href="https://doi.org/10.5194/essd-15-5301-2023" ext-link-type="DOI">10.5194/essd-15-5301-2023</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib17"><label>17</label><mixed-citation>Fu, Z., Hu, L., Chen, Z., Zhang, F., Shi, Z., Hu, B., Du, Z., and Liu, R.: Estimating spatial and temporal variation in ocean surface <inline-formula><mml:math id="M750" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the Gulf of Mexico using remote sensing and machine learning techniques, Sci. Total Environ., 745, 140965, <ext-link xlink:href="https://doi.org/10.1016/j.scitotenv.2020.140965" ext-link-type="DOI">10.1016/j.scitotenv.2020.140965</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib18"><label>18</label><mixed-citation>Gloege, L., Yan, M., Zheng, T., and McKinley, G. A.: Improved Quantification of Ocean Carbon Uptake by Using Machine Learning to Merge Global Models and <inline-formula><mml:math id="M752" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> Data, J. Adv. Model. Earth Sy., 14, e2021MS002620, <ext-link xlink:href="https://doi.org/10.1029/2021MS002620" ext-link-type="DOI">10.1029/2021MS002620</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib19"><label>19</label><mixed-citation>Gregor, L. and Gruber, N.: OceanSODA-ETHZ: a global gridded data set of the surface ocean carbonate system for seasonal to decadal studies of ocean acidification, Earth Syst. Sci. Data, 13, 777–808, <ext-link xlink:href="https://doi.org/10.5194/essd-13-777-2021" ext-link-type="DOI">10.5194/essd-13-777-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib20"><label>20</label><mixed-citation>Hersbach, H., Bell, B., Berrisford, P., Biavati, G., Horányi, A., Muñoz Sabater, J., Nicolas, J., Peubey, C., Radu, R., Rozum, I., and others: ERA5 monthly averaged data on single levels from 1979 to present, Copernicus Climate Change Service (C3S) Climate Data Store (CDS), 10, 252–266, <ext-link xlink:href="https://doi.org/10.24381/cds.f17050d7" ext-link-type="DOI">10.24381/cds.f17050d7</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib21"><label>21</label><mixed-citation>Huang, B., Liu, C., Banzon, V., Freeman, E., Graham, G., Hankins, B., Smith, T., and Zhang, H.-M.: Improvements of the Daily Optimum Interpolation Sea Surface Temperature (DOISST) Version 2.1, J. Climate, 34, 2923–2939, <ext-link xlink:href="https://doi.org/10.1175/JCLI-D-20-0166.1" ext-link-type="DOI">10.1175/JCLI-D-20-0166.1</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib22"><label>22</label><mixed-citation>Hughes, I. and Hase, T. P. A.: Measurements and their uncertainties: a practical guide to modern error analysis,  Oxford University Press, New York, 136 pp., ISBN 978-0-19-956632-7, 978-0-19-956633-4, 2010.</mixed-citation></ref>
      <ref id="bib1.bib23"><label>23</label><mixed-citation>Iida, Y., Takatani, Y., Kojima, A., and Ishii, M.: Global trends of ocean CO2 sink and ocean acidification: an observation-based reconstruction of surface ocean inorganic carbon variables, J. Oceanogr., 77, 323–358, <ext-link xlink:href="https://doi.org/10.1007/s10872-020-00571-5" ext-link-type="DOI">10.1007/s10872-020-00571-5</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib24"><label>24</label><mixed-citation>Kealoha, A. K., Shamberger, K. E. F., DiMarco, S. F., Thyng, K. M., Hetland, R. D., Manzello, D. P., Slowey, N. C., and Enochs, I. C.: Surface Water CO<sub>2</sub> variability in the Gulf of Mexico (1996–2017), Sci. Rep., 10, 12279, <ext-link xlink:href="https://doi.org/10.1038/s41598-020-68924-0" ext-link-type="DOI">10.1038/s41598-020-68924-0</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib25"><label>25</label><mixed-citation>Lan, X., Tans, P., Thoning, K., and NOAA Global Monitoring Laboratory: NOAA Greenhouse Gas Marine Boundary Layer Reference – CO<sub>2</sub>, NOAA GML [data set], <ext-link xlink:href="https://doi.org/10.15138/DVNP-F961" ext-link-type="DOI">10.15138/DVNP-F961</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib26"><label>26</label><mixed-citation>Landschützer, P., Gruber, N., Bakker, D. C. E., and Schuster, U.: Recent variability of the global ocean carbon sink, Global Biogeochem. Cy., 28, 927–949, <ext-link xlink:href="https://doi.org/10.1002/2014GB004853" ext-link-type="DOI">10.1002/2014GB004853</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib27"><label>27</label><mixed-citation>Landschützer, P., Gruber, N., and Bakker, D. C. E.: An observation-based global monthly gridded sea surface <inline-formula><mml:math id="M756" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product from 1982 onward and its monthly climatology (NCEI Accession 0160558), NOAA National Centers for Environmental Information [data set], <ext-link xlink:href="https://doi.org/10.7289/V5Z899N6" ext-link-type="DOI">10.7289/V5Z899N6</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib28"><label>28</label><mixed-citation>Landschützer, P., Laruelle, G. G., Roobaert, A., and Regnier, P.: A uniform <inline-formula><mml:math id="M758" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> climatology combining open and coastal oceans, Earth Syst. Sci. Data, 12, 2537–2553, <ext-link xlink:href="https://doi.org/10.5194/essd-12-2537-2020" ext-link-type="DOI">10.5194/essd-12-2537-2020</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib29"><label>29</label><mixed-citation>Laruelle, G. G., Landschützer, P., Gruber, N., Tison, J.-L., Delille, B., and Regnier, P.: Global high-resolution monthly <inline-formula><mml:math id="M760" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> climatology for the coastal ocean derived from neural network interpolation, Biogeosciences, 14, 4545–4561, <ext-link xlink:href="https://doi.org/10.5194/bg-14-4545-2017" ext-link-type="DOI">10.5194/bg-14-4545-2017</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib30"><label>30</label><mixed-citation>Laruelle, G. G., Cai, W.-J., Hu, X., Gruber, N., Mackenzie, F. T., and Regnier, P.: Continental shelves as a variable but increasing global sink for atmospheric carbon dioxide, Nat. Commun., 9, 454, <ext-link xlink:href="https://doi.org/10.1038/s41467-017-02738-z" ext-link-type="DOI">10.1038/s41467-017-02738-z</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib31"><label>31</label><mixed-citation>Lavoie, D., Lambert, N., Starr, M., Chassé, J., Riche, O., Le Clainche, Y., Azetsu-Scott, K., Béjaoui, B., Christian, J. R., and Gilbert, D.: The Gulf of St. Lawrence Biogeochemical Model: A Modelling Tool for Fisheries and Ocean Management, Front. Mar. Sci., 8, 732269, <ext-link xlink:href="https://doi.org/10.3389/fmars.2021.732269" ext-link-type="DOI">10.3389/fmars.2021.732269</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib32"><label>32</label><mixed-citation>Lohrenz, S. E. and Cai, W.-J.: Satellite ocean color assessment of air-sea fluxes of CO<sub>2</sub> in a river-dominated coastal margin: CO<sub>2</sub> FLUXES in a River-Dominated Margin, Geophys. Res. Lett., 33, L01601, <ext-link xlink:href="https://doi.org/10.1029/2005GL023942" ext-link-type="DOI">10.1029/2005GL023942</ext-link>, 2006.</mixed-citation></ref>
      <ref id="bib1.bib33"><label>33</label><mixed-citation>Lu, W., Su, H., Yang, X., and Yan, X.-H.: Subsurface temperature estimation from remote sensing data using a clustering-neural network method, Remote Sens. Environ., 229, 213–222, <ext-link xlink:href="https://doi.org/10.1016/j.rse.2019.04.009" ext-link-type="DOI">10.1016/j.rse.2019.04.009</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib34"><label>34</label><mixed-citation>McWilliams, J. C.: Submesoscale, coherent vortices in the ocean, Rev. Geophys., 23, 165–182, <ext-link xlink:href="https://doi.org/10.1029/RG023i002p00165" ext-link-type="DOI">10.1029/RG023i002p00165</ext-link>, 1985.</mixed-citation></ref>
      <ref id="bib1.bib35"><label>35</label><mixed-citation>O'Reilly, J. E., Maritorena, S., Mitchell, B. G., Siegel, D. A., Carder, K. L., Garver, S. A., Kahru, M., and McClain, C.: Ocean color chlorophyll algorithms for SeaWiFS, J. Geophys. Res., 103, 24937–24953, <ext-link xlink:href="https://doi.org/10.1029/98JC02160" ext-link-type="DOI">10.1029/98JC02160</ext-link>, 1998.</mixed-citation></ref>
      <ref id="bib1.bib36"><label>36</label><mixed-citation>Ren, H., Lu, W., Xiao, W., Zhu, Q., Xiao, C., and Lai, Z.: Intraseasonal response of marine planktonic ecosystem to summertime Madden-Julian Oscillation in the South China Sea: A model study, Prog. Oceanogr., 224, 103251, <ext-link xlink:href="https://doi.org/10.1016/j.pocean.2024.103251" ext-link-type="DOI">10.1016/j.pocean.2024.103251</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib37"><label>37</label><mixed-citation>Robbins, L. L., Daly, K. L., Barbero, L., Wanninkhof, R., He, R., Zong, H., Lisle, J. T., Cai, W. -J., and Smith, C. G.: Spatial and Temporal Variability of <inline-formula><mml:math id="M764" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub>, Carbon Fluxes, and Saturation State on the West Florida Shelf, J. Geophys. Res.-Oceans, 123, 6174–6188, <ext-link xlink:href="https://doi.org/10.1029/2018JC014195" ext-link-type="DOI">10.1029/2018JC014195</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib38"><label>38</label><mixed-citation>Rödenbeck, C., DeVries, T., Hauck, J., Le Quéré, C., and Keeling, R. F.: Data-based estimates of interannual sea–air CO<sub>2</sub> flux variations 1957–2020 and their relation to environmental drivers, Biogeosciences, 19, 2627–2652, <ext-link xlink:href="https://doi.org/10.5194/bg-19-2627-2022" ext-link-type="DOI">10.5194/bg-19-2627-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib39"><label>39</label><mixed-citation>Roobaert, A., Resplandy, L., Laruelle, G. G., Liao, E., and Regnier, P.: A framework to evaluate and elucidate the driving mechanisms of coastal sea surface <inline-formula><mml:math id="M767" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> seasonality using an ocean general circulation model (MOM6-COBALT), Ocean Sci., 18, 67–88, <ext-link xlink:href="https://doi.org/10.5194/os-18-67-2022" ext-link-type="DOI">10.5194/os-18-67-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib40"><label>40</label><mixed-citation>Roobaert, A., Regnier, P., Landschützer, P., and Laruelle, G. G.: A novel sea surface pCO2-product for the global coastal ocean resolving trends over 1982–2020, Earth Syst. Sci. Data, 16, 421–441, <ext-link xlink:href="https://doi.org/10.5194/essd-16-421-2024" ext-link-type="DOI">10.5194/essd-16-421-2024</ext-link>, 2024a.</mixed-citation></ref>
      <ref id="bib1.bib41"><label>41</label><mixed-citation>Roobaert, A., Resplandy, L., Laruelle, G. G., Liao, E., and Regnier, P.: Unraveling the Physical and Biological Controls of the Global Coastal CO<sub>2</sub> Sink, Global Biogeochem. Cy., 38, e2023GB007799, <ext-link xlink:href="https://doi.org/10.1029/2023GB007799" ext-link-type="DOI">10.1029/2023GB007799</ext-link>, 2024b.</mixed-citation></ref>
      <ref id="bib1.bib42"><label>42</label><mixed-citation>Ross, A. C., Stock, C. A., Adcroft, A., Curchitser, E., Hallberg, R., Harrison, M. J., Hedstrom, K., Zadeh, N., Alexander, M., Chen, W., Drenkard, E. J., du Pontavice, H., Dussin, R., Gomez, F., John, J. G., Kang, D., Lavoie, D., Resplandy, L., Roobaert, A., Saba, V., Shin, S.-I., Siedlecki, S., and Simkins, J.: A high-resolution physical–biogeochemical model for marine resource applications in the northwest Atlantic (MOM6-COBALT-NWA12 v1.0), Geosci. Model Dev., 16, 6943–6985, <ext-link xlink:href="https://doi.org/10.5194/gmd-16-6943-2023" ext-link-type="DOI">10.5194/gmd-16-6943-2023</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib43"><label>43</label><mixed-citation>Rutherford, K., Fennel, K., Atamanchuk, D., Wallace, D., and Thomas, H.: A modelling study of temporal and spatial <inline-formula><mml:math id="M770" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> variability on the biologically active and temperature-dominated Scotian Shelf, Biogeosciences, 18, 6271–6286, <ext-link xlink:href="https://doi.org/10.5194/bg-18-6271-2021" ext-link-type="DOI">10.5194/bg-18-6271-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib44"><label>44</label><mixed-citation>Salisbury, J. E. and Jönsson, B. F.: Rapid warming and salinity changes in the Gulf of Maine alter surface ocean carbonate parameters and hide ocean acidification, Biogeochemistry, 141, 401–418, <ext-link xlink:href="https://doi.org/10.1007/s10533-018-0505-3" ext-link-type="DOI">10.1007/s10533-018-0505-3</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib45"><label>45</label><mixed-citation>Sharp, J. D., Fassbender, A. J., Carter, B. R., Lavin, P. D., and Sutton, A. J.: A monthly surface <inline-formula><mml:math id="M772" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> product for the California Current Large Marine Ecosystem, Earth Syst. Sci. Data, 14, 2081–2108, <ext-link xlink:href="https://doi.org/10.5194/essd-14-2081-2022" ext-link-type="DOI">10.5194/essd-14-2081-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib46"><label>46</label><mixed-citation>Signorini, S. R., Mannino, A., Najjar, R. G., Friedrichs, M. A. M., Cai, W.-J., Salisbury, J., Wang, Z. A., Thomas, H., and Shadwick, E.: Surface ocean <inline-formula><mml:math id="M774" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> seasonality and sea-air CO<sub>2</sub> flux estimates for the North American east coast, J. Geophys. Res.-Oceans, 118, 5439–5460, <ext-link xlink:href="https://doi.org/10.1002/jgrc.20369" ext-link-type="DOI">10.1002/jgrc.20369</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib47"><label>47</label><mixed-citation>Song, L., Lee, Z., Shang, S., Huang, B., Wu, J., Wu, Z., Lu, W., and Liu, X.: On the spatial and temporal variations of primary production in the South China Sea, IEEE T. Geosci. Remote, 61, 4201514, <ext-link xlink:href="https://doi.org/10.1109/TGRS.2023.3241209" ext-link-type="DOI">10.1109/TGRS.2023.3241209</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib48"><label>48</label><mixed-citation>Su, H., Zhang, H., Geng, X., Qin, T., Lu, W., and Yan, X.-H.: OPEN: A New Estimation of Global Ocean Heat Content for Upper 2000 Meters from Remote Sensing Data, Remote Sensing, 12, 2294, <ext-link xlink:href="https://doi.org/10.3390/rs12142294" ext-link-type="DOI">10.3390/rs12142294</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib49"><label>49</label><mixed-citation>Sutton, A. J., Battisti, R., Carter, B., Evans, W., Newton, J., Alin, S., Bates, N. R., Cai, W.-J., Currie, K., Feely, R. A., Sabine, C., Tanhua, T., Tilbrook, B., and Wanninkhof, R.: Advancing best practices for assessing trends of ocean acidification time series, Front. Mar. Sci., 9, 1045667, <ext-link xlink:href="https://doi.org/10.3389/fmars.2022.1045667" ext-link-type="DOI">10.3389/fmars.2022.1045667</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib50"><label>50</label><mixed-citation>Takahashi, T., Sutherland, S. C., and Kozyr, A.: Global Ocean Surface Water Partial Pressure of CO2 Database: Measurements Performed During 1957–2019 (LDEO Database Version 2019) (NCEI Accession 0160492). Version 9.9, NOAA National Centers for Environmental Information [data set], <ext-link xlink:href="https://doi.org/10.3334/CDIAC/OTG.NDP088(V2015)" ext-link-type="DOI">10.3334/CDIAC/OTG.NDP088(V2015)</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib51"><label>51</label><mixed-citation>Taylor, J. R.: An introduction to error analysis: the study of uncertainties in physical measurements, 2nd edn., University Science Books, Sausalito, Calif, 327 pp., ISBN 978-0-935702-42-2, 978-0-935702-75-0, 1997.</mixed-citation></ref>
      <ref id="bib1.bib52"><label>52</label><mixed-citation>Vandemark, D., Salisbury, J. E., Hunt, C. W., Shellito, S. M., Irish, J. D., McGillis, W. R., Sabine, C. L., and Maenner, S. M.: Temporal and spatial dynamics of CO<sub>2</sub> air-sea flux in the Gulf of Maine, J. Geophys. Res., 116, C01012, <ext-link xlink:href="https://doi.org/10.1029/2010JC006408" ext-link-type="DOI">10.1029/2010JC006408</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib53"><label>53</label><mixed-citation>Wang, T., Yu, P., Wu, Z., Lu, W., Liu, X., Li, Q. P., and Huang, B.: Revisiting the Intraseasonal Variability of Chlorophyll-a in the Adjacent Luzon Strait With a New Gap-Filled Remote Sensing Data Set, IEEE T. Geosci. Remote, 60, 4201311, <ext-link xlink:href="https://doi.org/10.1109/TGRS.2021.3067646" ext-link-type="DOI">10.1109/TGRS.2021.3067646</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib54"><label>54</label><mixed-citation>Wang, Y., Wu, Z., Lu, W., Yu, S., Li, S., Meng, L., Geng, X., and Yan, X.-H.: Remote sensing estimations of the seawater partial pressure of CO<sub>2</sub> using sea surface roughness derived from Synthetic Aperture Radar, IEEE T. Geosci. Remote, 62,  4204913, <ext-link xlink:href="https://doi.org/10.1109/TGRS.2024.3379984" ext-link-type="DOI">10.1109/TGRS.2024.3379984</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib55"><label>55</label><mixed-citation>Wang, Z., Wang, G., Guo, X., Bai, Y., Xu, Y., and Dai, M.: Spatial reconstruction of long-term (2003–2020) sea surface <inline-formula><mml:math id="M779" display="inline"><mml:mi>p</mml:mi></mml:math></inline-formula>CO<sub>2</sub> in the South China Sea using a machine-learning-based regression method aided by empirical orthogonal function analysis, Earth Syst. Sci. Data, 15, 1711–1731, <ext-link xlink:href="https://doi.org/10.5194/essd-15-1711-2023" ext-link-type="DOI">10.5194/essd-15-1711-2023</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib56"><label>56</label><mixed-citation>Wang, Z. A., Bienvenu, D. J., Mann, P. J., Hoering, K. A., Poulsen, J. R., Spencer, R. G. M., and Holmes, R. M.: Inorganic carbon speciation and fluxes in the Congo River: The Congo River Inorganic Carbon System, Geophys. Res. Lett., 40, 511–516, <ext-link xlink:href="https://doi.org/10.1002/grl.50160" ext-link-type="DOI">10.1002/grl.50160</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib57"><label>57</label><mixed-citation>Wanninkhof, R., Barbero, L., Byrne, R., Cai, W.-J., Huang, W.-J., Zhang, J.-Z., Baringer, M., and Langdon, C.: Ocean acidification along the Gulf Coast and East Coast of the USA, Cont. Shelf Res., 98, 54–71, <ext-link xlink:href="https://doi.org/10.1016/j.csr.2015.02.008" ext-link-type="DOI">10.1016/j.csr.2015.02.008</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib58"><label>58</label><mixed-citation>Weiss, R. F. and Price, B. A.: Nitrous oxide solubility in water and seawater, Mar. Chem., 8, 347–359, <ext-link xlink:href="https://doi.org/10.1016/0304-4203(80)90024-9" ext-link-type="DOI">10.1016/0304-4203(80)90024-9</ext-link>, 1980.</mixed-citation></ref>
      <ref id="bib1.bib59"><label>59</label><mixed-citation>Wu, Z.: ReCAD, GitHub [code], <uri>https://github.com/zelunwu/ReCAD</uri>, last access: 1 December 2024.</mixed-citation></ref>
      <ref id="bib1.bib60"><label>60</label><mixed-citation>Wu, Z., Lu, W., Roobaert, A., Song, L., Yan, X.-H., and Cai, W.-J.: A Reconstructed Coastal Acidification Database (ReCAD) pCO2 data product for the North American Atlantic Coastal Ocean Margins (1.1), Zenodo [data set], <ext-link xlink:href="https://doi.org/10.5281/zenodo.14038561" ext-link-type="DOI">10.5281/zenodo.14038561</ext-link>, 2024a.</mixed-citation></ref>
      <ref id="bib1.bib61"><label>61</label><mixed-citation>Wu, Z., Wang, H., Liao, E., Hu, C., Edwing, K., Yan, X.-H., and Cai, W.-J.: Air-sea CO<sub>2</sub> flux in the Gulf of Mexico from observations and multiple machine-learning data products, Prog. Oceanogr., 223, 103244, <ext-link xlink:href="https://doi.org/10.1016/j.pocean.2024.103244" ext-link-type="DOI">10.1016/j.pocean.2024.103244</ext-link>, 2024b.</mixed-citation></ref>
      <ref id="bib1.bib62"><label>62</label><mixed-citation>Xu, Y., Cai, W., Wanninkhof, R., Salisbury, J., Reimer, J., and Chen, B.: Long-Term Changes of Carbonate Chemistry Variables Along the North American East Coast, J. Geophys. Res.-Oceans, 125, e2019JC015982, <ext-link xlink:href="https://doi.org/10.1029/2019JC015982" ext-link-type="DOI">10.1029/2019JC015982</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib63"><label>63</label><mixed-citation>Yang, G. G., Wang, Q., Feng, J., He, L., Li, R., Lu, W., Liao, E., and Lai, Z.: Can three-dimensional nitrate structure be reconstructed from surface information with artificial intelligence? – A proof-of-concept study, Sci. Total Environ., 924, 171365, <ext-link xlink:href="https://doi.org/10.1016/j.scitotenv.2024.171365" ext-link-type="DOI">10.1016/j.scitotenv.2024.171365</ext-link>, 2024. </mixed-citation></ref>
      <ref id="bib1.bib64"><label>64</label><mixed-citation>Zeng, J., Nojiri, Y., Landschützer, P., Telszewski, M., and Nakaoka, S.: A Global Surface Ocean <inline-formula><mml:math id="M782" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula>CO<sub>2</sub> Climatology Based on a Feed-Forward Neural Network, J. Atmos. Ocean. Tech., 31, 1838–1849, <ext-link xlink:href="https://doi.org/10.1175/JTECH-D-13-00137.1" ext-link-type="DOI">10.1175/JTECH-D-13-00137.1</ext-link>, 2014.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>A machine-learning reconstruction of sea surface <i>p</i>CO<sub>2</sub> in the North American Atlantic Coastal Ocean Margin from 1993 to 2021</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>1</label><mixed-citation>
      
Bakker, D. C. E., Pfeil, B., Landa, C. S., Metzl, N., O'Brien, K. M., Olsen, A., Smith, K., Cosca, C., Harasawa, S., Jones, S. D., Nakaoka, S., Nojiri, Y., Schuster, U., Steinhoff, T., Sweeney, C., Takahashi, T., Tilbrook, B., Wada, C., Wanninkhof, R., Alin, S. R., Balestrini, C. F., Barbero, L., Bates, N. R., Bianchi, A. A., Bonou, F., Boutin, J., Bozec, Y., Burger, E. F., Cai, W.-J., Castle, R. D., Chen, L., Chierici, M., Currie, K., Evans, W., Featherstone, C., Feely, R. A., Fransson, A., Goyet, C., Greenwood, N., Gregor, L., Hankin, S., Hardman-Mountford, N. J., Harlay, J., Hauck, J., Hoppema, M., Humphreys, M. P., Hunt, C. W., Huss, B., Ibánhez, J. S. P., Johannessen, T., Keeling, R., Kitidis, V., Körtzinger, A., Kozyr, A., Krasakopoulou, E., Kuwata, A., Landschützer, P., Lauvset, S. K., Lefèvre, N., Lo Monaco, C., Manke, A., Mathis, J. T., Merlivat, L., Millero, F. J., Monteiro, P. M. S., Munro, D. R., Murata, A., Newberger, T., Omar, A. M., Ono, T., Paterson, K., Pearce, D., Pierrot, D., Robbins, L. L., Saito, S., Salisbury, J., Schlitzer, R., Schneider, B., Schweitzer, R., Sieger, R., Skjelvan, I., Sullivan, K. F., Sutherland, S. C., Sutton, A. J., Tadokoro, K., Telszewski, M., Tuma, M., van Heuven, S. M. A. C., Vandemark, D., Ward, B., Watson, A. J., and Xu, S.: A multi-decade record of high-quality fCO2 data in version 3 of the Surface Ocean CO2 Atlas (SOCAT), Earth Syst. Sci. Data, 8, 383–413, <a href="https://doi.org/10.5194/essd-8-383-2016" target="_blank">https://doi.org/10.5194/essd-8-383-2016</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>2</label><mixed-citation>
      Breiman, L.: Random Forests, Machine Learning, 45, 5–32,
<a href="https://doi.org/10.1023/A:1010933404324" target="_blank">https://doi.org/10.1023/A:1010933404324</a>, 2001.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>3</label><mixed-citation>
      Cahill, B., Wilkin, J., Fennel, K., Vandemark, D., and Friedrichs, M. A. M.:
Interannual and seasonal variabilities in air-sea CO<sub>2</sub> fluxes along the
U.S. eastern continental shelf and their sensitivity to increasing air
temperatures and variable winds: U.S. East Coast Shelf Air-Sea CO<sub>2</sub>
Fluxes, J. Geophys. Res.-Biogeo., 121, 295–311,
<a href="https://doi.org/10.1002/2015JG002939" target="_blank">https://doi.org/10.1002/2015JG002939</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>4</label><mixed-citation>
      Cai, W.-J., Xu, Y.-Y., Feely, R. A., Wanninkhof, R., Jönsson, B., Alin,
S. R., Barbero, L., Cross, J. N., Azetsu-Scott, K., Fassbender, A. J.,
Carter, B. R., Jiang, L.-Q., Pepin, P., Chen, B., Hussain, N., Reimer, J.
J., Xue, L., Salisbury, J. E., Hernández-Ayón, J. M., Langdon, C.,
Li, Q., Sutton, A. J., Chen, C.-T. A., and Gledhill, D. K.: Controls on
surface water carbonate chemistry along North American ocean margins, Nat.
Commun., 11, 2691, <a href="https://doi.org/10.1038/s41467-020-16530-z" target="_blank">https://doi.org/10.1038/s41467-020-16530-z</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>5</label><mixed-citation>
      Carter, B. R., Feely, R. A., Williams, N. L., Dickson, A. G., Fong, M. B.,
and Takeshita, Y.: Updated methods for global locally interpolated
estimation of alkalinity, pH, and nitrate: LIR: Global alkalinity, pH, and
nitrate estimates, Limnol. Oceanogr. Methods, 16, 119–131,
<a href="https://doi.org/10.1002/lom3.10232" target="_blank">https://doi.org/10.1002/lom3.10232</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>6</label><mixed-citation>
      Carton, J. A., Chepurin, G. A., and Chen, L.: SODA3: A New Ocean Climate
Reanalysis, J. Climate, 31, 6967–6983,
<a href="https://doi.org/10.1175/JCLI-D-18-0149.1" target="_blank">https://doi.org/10.1175/JCLI-D-18-0149.1</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>7</label><mixed-citation>
      Chau, T. T. T., Gehlen, M., and Chevallier, F.: A seamless ensemble-based reconstruction of surface ocean <i>p</i>CO<sub>2</sub> and air–sea CO<sub>2</sub> fluxes over the global coastal and open oceans, Biogeosciences, 19, 1087–1109, <a href="https://doi.org/10.5194/bg-19-1087-2022" target="_blank">https://doi.org/10.5194/bg-19-1087-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>8</label><mixed-citation>
       Chen, C.-T. A., Huang, T.-H., Chen, Y.-C., Bai, Y., He, X., and Kang, Y.: Air–sea exchanges of CO<sub>2</sub> in the world's coastal seas, Biogeosciences, 10, 6509–6544, <a href="https://doi.org/10.5194/bg-10-6509-2013" target="_blank">https://doi.org/10.5194/bg-10-6509-2013</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>9</label><mixed-citation>
      Chen, S. and Hu, C.: Environmental controls of surface water <i>p</i>CO<sub>2</sub> in
different coastal environments: Observations from marine buoys, Cont.
Shelf Res., 183, 73–86, <a href="https://doi.org/10.1016/j.csr.2019.06.007" target="_blank">https://doi.org/10.1016/j.csr.2019.06.007</a>,
2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>10</label><mixed-citation>
      E.U. Copernicus Marine Service Information (CMEMS): Global Ocean Gridded L4 Sea
Surface Heights and Derived Variables Reprocessed (1993–ongoing), [data set],
<a href="https://doi.org/10.48670/moi-00148" target="_blank">https://doi.org/10.48670/moi-00148</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>11</label><mixed-citation>
      Dai, M., Su, J., Zhao, Y., Hofmann, E. E., Cao, Z., Cai, W.-J., Gan, J.,
Lacroix, F., Laruelle, G. G., Meng, F., Müller, J. D., Regnier, P. A.
G., Wang, G., and Wang, Z.: Carbon Fluxes in the Coastal Ocean: Synthesis,
Boundary Processes and Future Trends, Annu. Rev. Earth Planet. Sci., 50,
593–626,
<a href="https://doi.org/10.1146/annurev-earth-032320-090746" target="_blank">https://doi.org/10.1146/annurev-earth-032320-090746</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>12</label><mixed-citation>
      Fay, A. R., Gregor, L., Landschützer, P., McKinley, G. A., Gruber, N., Gehlen, M., Iida, Y., Laruelle, G. G., Rödenbeck, C., Roobaert, A., and Zeng, J.: SeaFlux: harmonization of air–sea CO<sub>2</sub> fluxes from surface <i>p</i>CO<sub>2</sub> data products using a standardized approach, Earth Syst. Sci. Data, 13, 4693–4710, <a href="https://doi.org/10.5194/essd-13-4693-2021" target="_blank">https://doi.org/10.5194/essd-13-4693-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>13</label><mixed-citation>
      Fennel, K. and Wilkin, J.: Quantifying biological carbon export for the
northwest North Atlantic continental shelves, Geophys. Res. Lett.,
36, L18605, <a href="https://doi.org/10.1029/2009GL039818" target="_blank">https://doi.org/10.1029/2009GL039818</a>, 2009.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>14</label><mixed-citation>
      Fennel, K., Alin, S., Barbero, L., Evans, W., Bourgeois, T., Cooley, S., Dunne, J., Feely, R. A., Hernandez-Ayon, J. M., Hu, X., Lohrenz, S., Muller-Karger, F., Najjar, R., Robbins, L., Shadwick, E., Siedlecki, S., Steiner, N., Sutton, A., Turk, D., Vlahos, P., and Wang, Z. A.: Carbon cycling in the North American coastal ocean: a synthesis, Biogeosciences, 16, 1281–1304, <a href="https://doi.org/10.5194/bg-16-1281-2019" target="_blank">https://doi.org/10.5194/bg-16-1281-2019</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>15</label><mixed-citation>
      Ford, D. J., Blannin, J., Watts, J., Watson, A. J., Landschützer, P.,
Jersild, A., and Shutler, J. D.: A Comprehensive Analysis of Air-Sea
CO<sub>2</sub> Flux Uncertainties Constructed From Surface Ocean Data Products,
Global Biogeochem. Cy., 38, e2024GB008188,
<a href="https://doi.org/10.1029/2024GB008188" target="_blank">https://doi.org/10.1029/2024GB008188</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>16</label><mixed-citation>
      Friedlingstein, P., O'Sullivan, M., Jones, M. W., Andrew, R. M., Bakker, D. C. E., Hauck, J., Landschützer, P., Le Quéré, C., Luijkx, I. T., Peters, G. P., Peters, W., Pongratz, J., Schwingshackl, C., Sitch, S., Canadell, J. G., Ciais, P., Jackson, R. B., Alin, S. R., Anthoni, P., Barbero, L., Bates, N. R., Becker, M., Bellouin, N., Decharme, B., Bopp, L., Brasika, I. B. M., Cadule, P., Chamberlain, M. A., Chandra, N., Chau, T.-T.-T., Chevallier, F., Chini, L. P., Cronin, M., Dou, X., Enyo, K., Evans, W., Falk, S., Feely, R. A., Feng, L., Ford, D. J., Gasser, T., Ghattas, J., Gkritzalis, T., Grassi, G., Gregor, L., Gruber, N., Gürses, Ö., Harris, I., Hefner, M., Heinke, J., Houghton, R. A., Hurtt, G. C., Iida, Y., Ilyina, T., Jacobson, A. R., Jain, A., Jarníková, T., Jersild, A., Jiang, F., Jin, Z., Joos, F., Kato, E., Keeling, R. F., Kennedy, D., Klein Goldewijk, K., Knauer, J., Korsbakken, J. I., Körtzinger, A., Lan, X., Lefèvre, N., Li, H., Liu, J., Liu, Z., Ma, L., Marland, G., Mayot, N., McGuire, P. C., McKinley, G. A., Meyer, G., Morgan, E. J., Munro, D. R., Nakaoka, S.-I., Niwa, Y., O'Brien, K. M., Olsen, A., Omar, A. M., Ono, T., Paulsen, M., Pierrot, D., Pocock, K., Poulter, B., Powis, C. M., Rehder, G., Resplandy, L., Robertson, E., Rödenbeck, C., Rosan, T. M., Schwinger, J., Séférian, R., Smallman, T. L., Smith, S. M., Sospedra-Alfonso, R., Sun, Q., Sutton, A. J., Sweeney, C., Takao, S., Tans, P. P., Tian, H., Tilbrook, B., Tsujino, H., Tubiello, F., van der Werf, G. R., van Ooijen, E., Wanninkhof, R., Watanabe, M., Wimart-Rousseau, C., Yang, D., Yang, X., Yuan, W., Yue, X., Zaehle, S., Zeng, J., and Zheng, B.: Global Carbon Budget 2023, Earth Syst. Sci. Data, 15, 5301–5369, <a href="https://doi.org/10.5194/essd-15-5301-2023" target="_blank">https://doi.org/10.5194/essd-15-5301-2023</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>17</label><mixed-citation>
      Fu, Z., Hu, L., Chen, Z., Zhang, F., Shi, Z., Hu, B., Du, Z., and Liu, R.:
Estimating spatial and temporal variation in ocean surface <i>p</i>CO<sub>2</sub> in the Gulf
of Mexico using remote sensing and machine learning techniques, Sci. Total Environ., 745, 140965,
<a href="https://doi.org/10.1016/j.scitotenv.2020.140965" target="_blank">https://doi.org/10.1016/j.scitotenv.2020.140965</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>18</label><mixed-citation>
      Gloege, L., Yan, M., Zheng, T., and McKinley, G. A.: Improved Quantification
of Ocean Carbon Uptake by Using Machine Learning to Merge Global Models and
<i>p</i>CO<sub>2</sub> Data, J. Adv. Model. Earth Sy., 14, e2021MS002620,
<a href="https://doi.org/10.1029/2021MS002620" target="_blank">https://doi.org/10.1029/2021MS002620</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>19</label><mixed-citation>
      Gregor, L. and Gruber, N.: OceanSODA-ETHZ: a global gridded data set of the surface ocean carbonate system for seasonal to decadal studies of ocean acidification, Earth Syst. Sci. Data, 13, 777–808, <a href="https://doi.org/10.5194/essd-13-777-2021" target="_blank">https://doi.org/10.5194/essd-13-777-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>20</label><mixed-citation>
      Hersbach, H., Bell, B., Berrisford, P., Biavati, G., Horányi, A.,
Muñoz Sabater, J., Nicolas, J., Peubey, C., Radu, R., Rozum, I., and
others: ERA5 monthly averaged data on single levels from 1979 to present,
Copernicus Climate Change Service (C3S) Climate Data Store (CDS), 10,
252–266, <a href="https://doi.org/10.24381/cds.f17050d7" target="_blank">https://doi.org/10.24381/cds.f17050d7</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>21</label><mixed-citation>
      Huang, B., Liu, C., Banzon, V., Freeman, E., Graham, G., Hankins, B., Smith,
T., and Zhang, H.-M.: Improvements of the Daily Optimum Interpolation Sea
Surface Temperature (DOISST) Version 2.1, J. Climate, 34,
2923–2939, <a href="https://doi.org/10.1175/JCLI-D-20-0166.1" target="_blank">https://doi.org/10.1175/JCLI-D-20-0166.1</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>22</label><mixed-citation>
      Hughes, I. and Hase, T. P. A.: Measurements and their uncertainties: a
practical guide to modern error analysis,  Oxford University
Press, New York, 136 pp., ISBN
978-0-19-956632-7,
978-0-19-956633-4, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>23</label><mixed-citation>
      Iida, Y., Takatani, Y., Kojima, A., and Ishii, M.: Global trends of ocean
CO2 sink and ocean acidification: an observation-based reconstruction of
surface ocean inorganic carbon variables, J. Oceanogr., 77, 323–358,
<a href="https://doi.org/10.1007/s10872-020-00571-5" target="_blank">https://doi.org/10.1007/s10872-020-00571-5</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>24</label><mixed-citation>
      Kealoha, A. K., Shamberger, K. E. F., DiMarco, S. F., Thyng, K. M., Hetland,
R. D., Manzello, D. P., Slowey, N. C., and Enochs, I. C.: Surface Water
CO<sub>2</sub> variability in the Gulf of Mexico (1996–2017), Sci. Rep., 10, 12279,
<a href="https://doi.org/10.1038/s41598-020-68924-0" target="_blank">https://doi.org/10.1038/s41598-020-68924-0</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>25</label><mixed-citation>
      Lan, X., Tans, P., Thoning, K., and NOAA Global Monitoring Laboratory: NOAA Greenhouse Gas Marine Boundary Layer Reference – CO<sub>2</sub>, NOAA GML [data set], <a href="https://doi.org/10.15138/DVNP-F961" target="_blank">https://doi.org/10.15138/DVNP-F961</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>26</label><mixed-citation>
      Landschützer, P., Gruber, N., Bakker, D. C. E., and Schuster, U.: Recent
variability of the global ocean carbon sink, Global Biogeochem. Cy.,
28, 927–949, <a href="https://doi.org/10.1002/2014GB004853" target="_blank">https://doi.org/10.1002/2014GB004853</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>27</label><mixed-citation>
      Landschützer, P., Gruber, N., and Bakker, D. C. E.: An observation-based
global monthly gridded sea surface <i>p</i>CO<sub>2</sub> product from 1982 onward and its
monthly climatology (NCEI Accession 0160558), NOAA National Centers for Environmental Information [data set],
<a href="https://doi.org/10.7289/V5Z899N6" target="_blank">https://doi.org/10.7289/V5Z899N6</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>28</label><mixed-citation>
      Landschützer, P., Laruelle, G. G., Roobaert, A., and Regnier, P.: A uniform <i>p</i>CO<sub>2</sub> climatology combining open and coastal oceans, Earth Syst. Sci. Data, 12, 2537–2553, <a href="https://doi.org/10.5194/essd-12-2537-2020" target="_blank">https://doi.org/10.5194/essd-12-2537-2020</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>29</label><mixed-citation>
      Laruelle, G. G., Landschützer, P., Gruber, N., Tison, J.-L., Delille, B., and Regnier, P.: Global high-resolution monthly <i>p</i>CO<sub>2</sub> climatology for the coastal ocean derived from neural network interpolation, Biogeosciences, 14, 4545–4561, <a href="https://doi.org/10.5194/bg-14-4545-2017" target="_blank">https://doi.org/10.5194/bg-14-4545-2017</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>30</label><mixed-citation>
      Laruelle, G. G., Cai, W.-J., Hu, X., Gruber, N., Mackenzie, F. T., and
Regnier, P.: Continental shelves as a variable but increasing global sink
for atmospheric carbon dioxide, Nat. Commun., 9, 454,
<a href="https://doi.org/10.1038/s41467-017-02738-z" target="_blank">https://doi.org/10.1038/s41467-017-02738-z</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>31</label><mixed-citation>
      Lavoie, D., Lambert, N., Starr, M., Chassé, J., Riche, O., Le Clainche,
Y., Azetsu-Scott, K., Béjaoui, B., Christian, J. R., and Gilbert, D.:
The Gulf of St. Lawrence Biogeochemical Model: A Modelling Tool for
Fisheries and Ocean Management, Front. Mar. Sci., 8, 732269,
<a href="https://doi.org/10.3389/fmars.2021.732269" target="_blank">https://doi.org/10.3389/fmars.2021.732269</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>32</label><mixed-citation>
      Lohrenz, S. E. and Cai, W.-J.: Satellite ocean color assessment of air-sea
fluxes of CO<sub>2</sub> in a river-dominated coastal margin: CO<sub>2</sub> FLUXES in a
River-Dominated Margin, Geophys. Res. Lett., 33, L01601,
<a href="https://doi.org/10.1029/2005GL023942" target="_blank">https://doi.org/10.1029/2005GL023942</a>, 2006.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>33</label><mixed-citation>
      Lu, W., Su, H., Yang, X., and Yan, X.-H.: Subsurface temperature estimation
from remote sensing data using a clustering-neural network method, Remote
Sens. Environ., 229, 213–222,
<a href="https://doi.org/10.1016/j.rse.2019.04.009" target="_blank">https://doi.org/10.1016/j.rse.2019.04.009</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>34</label><mixed-citation>
      McWilliams, J. C.: Submesoscale, coherent vortices in the ocean, Rev.
Geophys., 23, 165–182, <a href="https://doi.org/10.1029/RG023i002p00165" target="_blank">https://doi.org/10.1029/RG023i002p00165</a>, 1985.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>35</label><mixed-citation>
      O'Reilly, J. E., Maritorena, S., Mitchell, B. G., Siegel, D. A., Carder, K.
L., Garver, S. A., Kahru, M., and McClain, C.: Ocean color chlorophyll
algorithms for SeaWiFS, J. Geophys. Res., 103, 24937–24953,
<a href="https://doi.org/10.1029/98JC02160" target="_blank">https://doi.org/10.1029/98JC02160</a>, 1998.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>36</label><mixed-citation>
      Ren, H., Lu, W., Xiao, W., Zhu, Q., Xiao, C., and Lai, Z.: Intraseasonal
response of marine planktonic ecosystem to summertime Madden-Julian
Oscillation in the South China Sea: A model study, Prog. Oceanogr.,
224, 103251, <a href="https://doi.org/10.1016/j.pocean.2024.103251" target="_blank">https://doi.org/10.1016/j.pocean.2024.103251</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>37</label><mixed-citation>
      Robbins, L. L., Daly, K. L., Barbero, L., Wanninkhof, R., He, R., Zong, H.,
Lisle, J. T., Cai, W. -J., and Smith, C. G.: Spatial and Temporal
Variability of <i>p</i>CO<sub>2</sub>, Carbon Fluxes, and Saturation State on the West
Florida Shelf, J. Geophys. Res.-Oceans, 123, 6174–6188,
<a href="https://doi.org/10.1029/2018JC014195" target="_blank">https://doi.org/10.1029/2018JC014195</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>38</label><mixed-citation>
      Rödenbeck, C., DeVries, T., Hauck, J., Le Quéré, C., and Keeling, R. F.: Data-based estimates of interannual sea–air CO<sub>2</sub> flux variations 1957–2020 and their relation to environmental drivers, Biogeosciences, 19, 2627–2652, <a href="https://doi.org/10.5194/bg-19-2627-2022" target="_blank">https://doi.org/10.5194/bg-19-2627-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>39</label><mixed-citation>
      Roobaert, A., Resplandy, L., Laruelle, G. G., Liao, E., and Regnier, P.: A framework to evaluate and elucidate the driving mechanisms of coastal sea surface <i>p</i>CO<sub>2</sub> seasonality using an ocean general circulation model (MOM6-COBALT), Ocean Sci., 18, 67–88, <a href="https://doi.org/10.5194/os-18-67-2022" target="_blank">https://doi.org/10.5194/os-18-67-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>40</label><mixed-citation>
      Roobaert, A., Regnier, P., Landschützer, P., and Laruelle, G. G.: A novel sea surface pCO2-product for the global coastal ocean resolving trends over 1982–2020, Earth Syst. Sci. Data, 16, 421–441, <a href="https://doi.org/10.5194/essd-16-421-2024" target="_blank">https://doi.org/10.5194/essd-16-421-2024</a>, 2024a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>41</label><mixed-citation>
      Roobaert, A., Resplandy, L., Laruelle, G. G., Liao, E., and Regnier, P.:
Unraveling the Physical and Biological Controls of the Global Coastal
CO<sub>2</sub> Sink, Global Biogeochem. Cy., 38, e2023GB007799,
<a href="https://doi.org/10.1029/2023GB007799" target="_blank">https://doi.org/10.1029/2023GB007799</a>, 2024b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>42</label><mixed-citation>
      Ross, A. C., Stock, C. A., Adcroft, A., Curchitser, E., Hallberg, R., Harrison, M. J., Hedstrom, K., Zadeh, N., Alexander, M., Chen, W., Drenkard, E. J., du Pontavice, H., Dussin, R., Gomez, F., John, J. G., Kang, D., Lavoie, D., Resplandy, L., Roobaert, A., Saba, V., Shin, S.-I., Siedlecki, S., and Simkins, J.: A high-resolution physical–biogeochemical model for marine resource applications in the northwest Atlantic (MOM6-COBALT-NWA12 v1.0), Geosci. Model Dev., 16, 6943–6985, <a href="https://doi.org/10.5194/gmd-16-6943-2023" target="_blank">https://doi.org/10.5194/gmd-16-6943-2023</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>43</label><mixed-citation>
      Rutherford, K., Fennel, K., Atamanchuk, D., Wallace, D., and Thomas, H.: A modelling study of temporal and spatial <i>p</i>CO<sub>2</sub> variability on the biologically active and temperature-dominated Scotian Shelf, Biogeosciences, 18, 6271–6286, <a href="https://doi.org/10.5194/bg-18-6271-2021" target="_blank">https://doi.org/10.5194/bg-18-6271-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>44</label><mixed-citation>
      Salisbury, J. E. and Jönsson, B. F.: Rapid warming and salinity changes
in the Gulf of Maine alter surface ocean carbonate parameters and hide ocean
acidification, Biogeochemistry, 141, 401–418,
<a href="https://doi.org/10.1007/s10533-018-0505-3" target="_blank">https://doi.org/10.1007/s10533-018-0505-3</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>45</label><mixed-citation>
      Sharp, J. D., Fassbender, A. J., Carter, B. R., Lavin, P. D., and Sutton, A. J.: A monthly surface <i>p</i>CO<sub>2</sub> product for the California Current Large Marine Ecosystem, Earth Syst. Sci. Data, 14, 2081–2108, <a href="https://doi.org/10.5194/essd-14-2081-2022" target="_blank">https://doi.org/10.5194/essd-14-2081-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>46</label><mixed-citation>
      Signorini, S. R., Mannino, A., Najjar, R. G., Friedrichs, M. A. M., Cai,
W.-J., Salisbury, J., Wang, Z. A., Thomas, H., and Shadwick, E.: Surface
ocean <i>p</i>CO<sub>2</sub> seasonality and sea-air CO<sub>2</sub> flux estimates for the North
American east coast, J. Geophys. Res.-Oceans, 118, 5439–5460,
<a href="https://doi.org/10.1002/jgrc.20369" target="_blank">https://doi.org/10.1002/jgrc.20369</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>47</label><mixed-citation>
      Song, L., Lee, Z., Shang, S., Huang, B., Wu, J., Wu, Z., Lu, W., and Liu,
X.: On the spatial and temporal variations of primary production in the
South China Sea, IEEE T. Geosci. Remote, 61, 4201514,
<a href="https://doi.org/10.1109/TGRS.2023.3241209" target="_blank">https://doi.org/10.1109/TGRS.2023.3241209</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>48</label><mixed-citation>
      Su, H., Zhang, H., Geng, X., Qin, T., Lu, W., and Yan, X.-H.: OPEN: A New
Estimation of Global Ocean Heat Content for Upper 2000 Meters from Remote
Sensing Data, Remote Sensing, 12, 2294, <a href="https://doi.org/10.3390/rs12142294" target="_blank">https://doi.org/10.3390/rs12142294</a>,
2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>49</label><mixed-citation>
      Sutton, A. J., Battisti, R., Carter, B., Evans, W., Newton, J., Alin, S.,
Bates, N. R., Cai, W.-J., Currie, K., Feely, R. A., Sabine, C., Tanhua, T.,
Tilbrook, B., and Wanninkhof, R.: Advancing best practices for assessing
trends of ocean acidification time series, Front. Mar. Sci., 9, 1045667,
<a href="https://doi.org/10.3389/fmars.2022.1045667" target="_blank">https://doi.org/10.3389/fmars.2022.1045667</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>50</label><mixed-citation>
      Takahashi, T., Sutherland, S. C., and Kozyr, A.: Global Ocean Surface Water Partial Pressure of CO2 Database: Measurements Performed During 1957–2019 (LDEO Database Version 2019) (NCEI Accession 0160492). Version 9.9, NOAA National Centers for Environmental Information [data set], <a href="https://doi.org/10.3334/CDIAC/OTG.NDP088(V2015)" target="_blank">https://doi.org/10.3334/CDIAC/OTG.NDP088(V2015)</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>51</label><mixed-citation>
      Taylor, J. R.: An introduction to error analysis: the study of uncertainties
in physical measurements, 2nd edn., University Science Books, Sausalito,
Calif, 327 pp., ISBN
978-0-935702-42-2,
978-0-935702-75-0, 1997.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>52</label><mixed-citation>
      Vandemark, D., Salisbury, J. E., Hunt, C. W., Shellito, S. M., Irish, J. D.,
McGillis, W. R., Sabine, C. L., and Maenner, S. M.: Temporal and spatial
dynamics of CO<sub>2</sub> air-sea flux in the Gulf of Maine, J. Geophys. Res.,
116, C01012, <a href="https://doi.org/10.1029/2010JC006408" target="_blank">https://doi.org/10.1029/2010JC006408</a>, 2011.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>53</label><mixed-citation>
      Wang, T., Yu, P., Wu, Z., Lu, W., Liu, X., Li, Q. P., and Huang, B.:
Revisiting the Intraseasonal Variability of Chlorophyll-a in the Adjacent
Luzon Strait With a New Gap-Filled Remote Sensing Data Set, IEEE T.
Geosci. Remote, 60, 4201311, <a href="https://doi.org/10.1109/TGRS.2021.3067646" target="_blank">https://doi.org/10.1109/TGRS.2021.3067646</a>,
2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>54</label><mixed-citation>
      Wang, Y., Wu, Z., Lu, W., Yu, S., Li, S., Meng, L., Geng, X., and Yan,
X.-H.: Remote sensing estimations of the seawater partial pressure of
CO<sub>2</sub> using sea surface roughness derived from Synthetic Aperture Radar,
IEEE T. Geosci. Remote, 62,  4204913,
<a href="https://doi.org/10.1109/TGRS.2024.3379984" target="_blank">https://doi.org/10.1109/TGRS.2024.3379984</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>55</label><mixed-citation>
      Wang, Z., Wang, G., Guo, X., Bai, Y., Xu, Y., and Dai, M.: Spatial reconstruction of long-term (2003–2020) sea surface <i>p</i>CO<sub>2</sub> in the South China Sea using a machine-learning-based regression method aided by empirical orthogonal function analysis, Earth Syst. Sci. Data, 15, 1711–1731, <a href="https://doi.org/10.5194/essd-15-1711-2023" target="_blank">https://doi.org/10.5194/essd-15-1711-2023</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>56</label><mixed-citation>
      Wang, Z. A., Bienvenu, D. J., Mann, P. J., Hoering, K. A., Poulsen, J. R.,
Spencer, R. G. M., and Holmes, R. M.: Inorganic carbon speciation and fluxes
in the Congo River: The Congo River Inorganic Carbon System, Geophys. Res.
Lett., 40, 511–516, <a href="https://doi.org/10.1002/grl.50160" target="_blank">https://doi.org/10.1002/grl.50160</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>57</label><mixed-citation>
      Wanninkhof, R., Barbero, L., Byrne, R., Cai, W.-J., Huang, W.-J., Zhang,
J.-Z., Baringer, M., and Langdon, C.: Ocean acidification along the Gulf
Coast and East Coast of the USA, Cont. Shelf Res., 98, 54–71,
<a href="https://doi.org/10.1016/j.csr.2015.02.008" target="_blank">https://doi.org/10.1016/j.csr.2015.02.008</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>58</label><mixed-citation>
      Weiss, R. F. and Price, B. A.: Nitrous oxide solubility in water and
seawater, Mar. Chem., 8, 347–359,
<a href="https://doi.org/10.1016/0304-4203(80)90024-9" target="_blank">https://doi.org/10.1016/0304-4203(80)90024-9</a>, 1980.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>59</label><mixed-citation>
      Wu, Z.: ReCAD, GitHub [code], <a href="https://github.com/zelunwu/ReCAD" target="_blank"/>, last access: 1 December 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>60</label><mixed-citation>
      Wu, Z., Lu, W., Roobaert, A., Song, L., Yan, X.-H., and Cai, W.-J.: A Reconstructed Coastal Acidification Database (ReCAD) pCO2 data product for the North American Atlantic Coastal Ocean Margins (1.1), Zenodo [data set], <a href="https://doi.org/10.5281/zenodo.14038561" target="_blank">https://doi.org/10.5281/zenodo.14038561</a>,
2024a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>61</label><mixed-citation>
      Wu, Z., Wang, H., Liao, E., Hu, C., Edwing, K., Yan, X.-H., and Cai, W.-J.:
Air-sea CO<sub>2</sub> flux in the Gulf of Mexico from observations and multiple
machine-learning data products, Prog. Oceanogr., 223, 103244,
<a href="https://doi.org/10.1016/j.pocean.2024.103244" target="_blank">https://doi.org/10.1016/j.pocean.2024.103244</a>, 2024b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>62</label><mixed-citation>
      Xu, Y., Cai, W., Wanninkhof, R., Salisbury, J., Reimer, J., and Chen, B.:
Long-Term Changes of Carbonate Chemistry Variables Along the North American
East Coast, J. Geophys. Res.-Oceans, 125, e2019JC015982,
<a href="https://doi.org/10.1029/2019JC015982" target="_blank">https://doi.org/10.1029/2019JC015982</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>63</label><mixed-citation>
      Yang, G. G., Wang, Q., Feng, J., He, L., Li, R., Lu, W., Liao, E., and Lai,
Z.: Can three-dimensional nitrate structure be reconstructed from surface
information with artificial intelligence? – A proof-of-concept study,
Sci. Total Environ., 924, 171365,
<a href="https://doi.org/10.1016/j.scitotenv.2024.171365" target="_blank">https://doi.org/10.1016/j.scitotenv.2024.171365</a>, 2024.


    </mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>64</label><mixed-citation>
      Zeng, J., Nojiri, Y., Landschützer, P., Telszewski, M., and Nakaoka, S.:
A Global Surface Ocean <i>f</i>CO<sub>2</sub> Climatology Based on a Feed-Forward Neural
Network, J. Atmos. Ocean. Tech., 31, 1838–1849,
<a href="https://doi.org/10.1175/JTECH-D-13-00137.1" target="_blank">https://doi.org/10.1175/JTECH-D-13-00137.1</a>, 2014.

    </mixed-citation></ref-html>--></article>
