<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="data-paper">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">ESSD</journal-id><journal-title-group>
    <journal-title>Earth System Science Data</journal-title>
    <abbrev-journal-title abbrev-type="publisher">ESSD</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Earth Syst. Sci. Data</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1866-3516</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/essd-18-3997-2026</article-id><title-group><article-title>CY-Bench: a comprehensive benchmark dataset for sub-national crop yield forecasting</article-title><alt-title>CY-Bench: a benchmark for crop yield forecasting</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" equal-contrib="yes" corresp="yes" rid="aff1">
          <name><surname>Kallenberg</surname><given-names>Michiel</given-names></name>
          <email>michiel.kallenberg@wur.nl</email>
        <ext-link>https://orcid.org/0000-0002-4661-6674</ext-link></contrib>
        <contrib contrib-type="author" equal-contrib="yes" corresp="no" rid="aff1">
          <name><surname>Paudel</surname><given-names>Dilli</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Ofori-Ampofo</surname><given-names>Stella</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Baja</surname><given-names>Hilmy</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-6995-3817</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>van Bree</surname><given-names>Ron</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Potze</surname><given-names>Aike</given-names></name>
          
        <ext-link>https://orcid.org/0009-0008-7812-3293</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Poudel</surname><given-names>Pratishtha</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4">
          <name><surname>Saleh</surname><given-names>Abdelrahman</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5">
          <name><surname>Anderson</surname><given-names>Weston</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>von Bloh</surname><given-names>Malte</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff6">
          <name><surname>Castellano</surname><given-names>Andres</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff7">
          <name><surname>Ennaji</surname><given-names>Oumnia</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff8">
          <name><surname>Hamed</surname><given-names>Raed</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-2243-3109</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff9">
          <name><surname>Laudien</surname><given-names>Rahel</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-5859-4030</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff10">
          <name><surname>Lee</surname><given-names>Donghoon</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff11">
          <name><surname>Luna</surname><given-names>Inti</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff12">
          <name><surname>Masiliūnas</surname><given-names>Dainius</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-5654-1277</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff13">
          <name><surname>Meroni</surname><given-names>Michele</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff14">
          <name><surname>Mutuku</surname><given-names>Janet Mumo</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff15">
          <name><surname>Mkuhlani</surname><given-names>Siyabusa</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff16">
          <name><surname>Richetti</surname><given-names>Jonathan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff6">
          <name><surname>Ruane</surname><given-names>Alex C.</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-5582-9217</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5">
          <name><surname>Sahajpal</surname><given-names>Ritvik</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-6418-289X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5">
          <name><surname>Shuai</surname><given-names>Guanyuan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Sitokonstantinou</surname><given-names>Vasileios</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-5506-2872</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff17">
          <name><surname>Nóia-Júnior</surname><given-names>Rogério de S.</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff18">
          <name><surname>Srivastava</surname><given-names>Amit Kumar</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-8219-4854</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff19">
          <name><surname>Strong</surname><given-names>Robert</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-5279-4808</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff20">
          <name><surname>Sweet</surname><given-names>Lily-belle</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-9971-6102</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff21">
          <name><surname>Vojnović</surname><given-names>Petar</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff22">
          <name><surname>de Wit</surname><given-names>Allard</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff23">
          <name><surname>Zachow</surname><given-names>Maximilian</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Athanasiadis</surname><given-names>Ioannis N.</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-2764-0078</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>Artificial Intelligence Group, Wageningen University and Research, P.O. Box 16, Wageningen, 6700 AA, the Netherlands</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>Chair of Data Science in Earth Observation, Technical University of Munich,  Arcisstraße 21, Munich, 80333, Germany</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>Department of Agronomy, Purdue University, 915 Mitch Daniels Blvd,  West Lafayette, IN 47907, United States</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>Department of Soil Science, University of Manitoba, 13 Freedman Crescent, Winnipeg, MB R3T 2N2, Canada</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>Department of Geographical Sciences, University of Maryland, 7251 Preinkert Drive, College Park, MD 20742, United States</institution>
        </aff>
        <aff id="aff6"><label>6</label><institution>GISS Impacts Group, NASA Goddard Institute for Space Studies, 535 West 116th Street, Mail Code 4312, New York, NY 10027, United States</institution>
        </aff>
        <aff id="aff7"><label>7</label><institution>College of Computing, Mohammed VI Polytechnic University, Lot 660, Benguerir, 43150, Morocco</institution>
        </aff>
        <aff id="aff8"><label>8</label><institution>Institute for Environmental Studies, Vrije Universiteit Amsterdam,  De Boelelaan 1105, Amsterdam, 1081 HV, the Netherlands</institution>
        </aff>
        <aff id="aff9"><label>9</label><institution>Department of Climate Resilience, Potsdam Institute for Climate Impact Research,  P.O. Box 60 12 03, Potsdam, 14412, Germany</institution>
        </aff>
        <aff id="aff10"><label>10</label><institution>Department of Civil Engineering, University of Manitoba, 15 Gillson Street,  Winnipeg, MB R3T 5V6, Canada</institution>
        </aff>
        <aff id="aff11"><label>11</label><institution>Image Processing Laboratory, Universitat de València,  C/Catedràtic Agustín Escardino Benlloch, 9, València, 46980, Spain</institution>
        </aff>
        <aff id="aff12"><label>12</label><institution>Laboratory of Geo-Information Science and Remote Sensing, Wageningen University and Research,  P.O. Box 47, Wageningen, 6700 AA, the Netherlands</institution>
        </aff>
        <aff id="aff13"><label>13</label><institution>Seidor Consulting, Carrer dels Provençals 44, Barcelona, 08019, Spain</institution>
        </aff>
        <aff id="aff14"><label>14</label><institution>West and Central Africa Region Hub, International Crops Research Institute for the Semi-Arid Tropics, P.O. Box 320, Bamako, Mali</institution>
        </aff>
        <aff id="aff15"><label>15</label><institution>Natural Resources Management, International Institute of Tropical Agriculture, P.O. Box 30677, Nairobi, 00100, Kenya</institution>
        </aff>
        <aff id="aff16"><label>16</label><institution>Agriculture and Food, Commonwealth Scientific and Industrial Research Organisation (CSIRO), 147 Underwood Av, Perth, WA 6014, Australia</institution>
        </aff>
        <aff id="aff17"><label>17</label><institution>UMR LEPSE, National Research Institute for Agriculture, Food and Environment (INRAE), 2 Pl. Pierre Viala, Montpellier, 34000, France</institution>
        </aff>
        <aff id="aff18"><label>18</label><institution>Simulation and Data Science- Multiscale modelling and Forecasting,  Leibniz Centre for Agricultural Landscape Research, Eberswalder Straße 84, Müncheberg, 15374, Germany</institution>
        </aff>
        <aff id="aff19"><label>19</label><institution>Agricultural Leadership, Education, and Communications, Texas A&amp;M University,  600 John Kimbrough Blvd, College Station, TX 77843-2116, United States</institution>
        </aff>
        <aff id="aff20"><label>20</label><institution>Department of Computational Hydrosystems, Helmholtz Centre for Environmental Research,  Permoserstraße 15, Leipzig, 04318, Germany</institution>
        </aff>
        <aff id="aff21"><label>21</label><institution>Fincons s.p.a, Via Torri Bianche 10, Vimercate, 20871, Italy</institution>
        </aff>
        <aff id="aff22"><label>22</label><institution>Earth Observation and Environmental Informatics, Wageningen University and Research,  P.O. Box 47, Wageningen, 6700 AA, the Netherlands</institution>
        </aff>
        <aff id="aff23"><label>23</label><institution>Chair of Digital Agriculture, Technical University of Munich,  Liesel-Beckmann-Straße 2, Freising, 85354, Germany</institution>
        </aff><author-comment content-type="econtrib"><p>These authors contributed equally to this work.</p></author-comment>
      </contrib-group>
      <author-notes><corresp id="corr1">Michiel Kallenberg (michiel.kallenberg@wur.nl)</corresp></author-notes><pub-date><day>11</day><month>June</month><year>2026</year></pub-date>
      
      <volume>18</volume>
      <issue>6</issue>
      <fpage>3997</fpage><lpage>4018</lpage>
      <history>
        <date date-type="received"><day>17</day><month>February</month><year>2025</year></date>
           <date date-type="rev-request"><day>12</day><month>March</month><year>2025</year></date>
           <date date-type="rev-recd"><day>15</day><month>April</month><year>2026</year></date>
           <date date-type="accepted"><day>13</day><month>May</month><year>2026</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 Michiel Kallenberg et al.</copyright-statement>
        <copyright-year>2026</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026.html">This article is available from https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026.html</self-uri><self-uri xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026.pdf">The full text article is available as a PDF file from https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e566">In-season, pre-harvest crop yield forecasts are essential for enhancing transparency in commodity markets and improving food security. They play a key role in increasing resilience to climate change and extreme events and thus contribute to the United Nations’ Sustainable Development Goal 2 of zero hunger. Pre-harvest crop yield forecasting is a complex task, as several interacting factors contribute to yield formation, including in-season weather variability, extreme events, long-term climate change, soil, pests, diseases and farm management decisions. Several modeling approaches have been employed to capture complex interactions among such predictors and crop yields. Prior research for in-season, pre-harvest crop yield forecasting has primarily been case-study based, which makes it difficult to compare modeling approaches and measure progress systematically. To address this gap, we introduce CY-Bench (Crop Yield Benchmark), a comprehensive dataset and benchmark to forecast maize and wheat yields at a global scale. CY-Bench was conceptualized and developed within the Machine Learning team of the Agricultural Model Intercomparison and Improvement Project (AgML) in collaboration with agronomists, climate scientists, and machine learning researchers. It features publicly available sub-national yield statistics and relevant predictors, such as weather data, soil characteristics, and remote sensing indicators, that have been pre-processed, standardized, and harmonized across spatio-temporal scales. 
With CY-Bench, we aim to: (i) establish a standardized framework for developing and evaluating data-driven models across diverse farming systems in more than 25 countries across six continents; (ii) enable robust and reproducible model comparisons that address real-world operational challenges; (iii) provide an openly accessible dataset to the earth system science and machine learning communities, facilitating research on time series forecasting, domain adaptation, and online learning. The dataset (<ext-link xlink:href="https://doi.org/10.5281/zenodo.11502142" ext-link-type="DOI">10.5281/zenodo.11502142</ext-link>, <xref ref-type="bibr" rid="bib1.bibx42" id="altparen.1"/>) and accompanying code (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>, <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.2"/>) are openly available to support the continuous development of advanced data-driven models for crop yield forecasting to enhance decision-making on food security.</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>HORIZON EUROPE Digital, Industry and Space</funding-source>
<award-id>101100622</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e590">The global food system faces significant challenges, including unequal access to resources and volatile markets, despite advancements in agricultural production <xref ref-type="bibr" rid="bib1.bibx1 bib1.bibx125 bib1.bibx13 bib1.bibx124 bib1.bibx96" id="paren.3"/>. To enhance food security policies, experts have emphasized the need for improved data, maps, and predictions <xref ref-type="bibr" rid="bib1.bibx63 bib1.bibx23 bib1.bibx26" id="paren.4"/>. Pre-harvest yield forecasts, in particular, play a critical role in enhancing global market transparency and enabling decision-makers to plan and respond effectively to potential food shortages, especially in the face of a changing climate <xref ref-type="bibr" rid="bib1.bibx6 bib1.bibx105 bib1.bibx101" id="paren.5"/>.</p>
      <p id="d2e602">Crop yield forecasts are produced by both private entities and government institutes using field surveys, process-based crop models <xref ref-type="bibr" rid="bib1.bibx31" id="paren.6"/>, and data-driven methods. The latter include statistical regression (e.g., linear models with predefined assumptions) and machine learning (e.g., random forests, neural networks) <xref ref-type="bibr" rid="bib1.bibx4 bib1.bibx94 bib1.bibx75" id="paren.7"/>. Commonly used predictors are weather, soil moisture, crop productivity, and remotely-sensed vegetation health indicators. Data availability determines the yield forecasting modeling setup and the selected spatial scale, which can range from national to sub-national and field levels. For example, the European Commission's Joint Research Centre (EC-JRC) regularly produces national crop yield forecasts for the EU and surrounding countries using crop models, agro-meteorological analyses and the expertise of analysts <xref ref-type="bibr" rid="bib1.bibx112" id="paren.8"/>. In India, the Ministry of Agriculture generates multi-season crop production forecasts for major crops from remote sensing and agro-meteorological data using statistical and crop models <xref ref-type="bibr" rid="bib1.bibx100" id="paren.9"/>. In the United States, the USDA's National Agricultural Statistics Service (NASS) publishes monthly crop forecasts on a multi-stage administrative scale, primarily based on in-field surveys <xref ref-type="bibr" rid="bib1.bibx32" id="paren.10"/>. Data for sub-national crop yield forecasting, which focuses on higher resolution administrative units (e.g., regions, provinces) and captures spatial yield variability within a country <xref ref-type="bibr" rid="bib1.bibx65 bib1.bibx76" id="paren.11"/>, is crucial for targeted food security planning. 
Such data is usually publicly available, but compiling it for many countries is challenging due to differences in collection and reporting protocols, including language and data format.</p>
      <p id="d2e627">Traditionally, crop yield prediction has been based on biophysical process-based crop models, grounded in decades of agricultural knowledge. Their challenges in parametrization <xref ref-type="bibr" rid="bib1.bibx34 bib1.bibx118 bib1.bibx99" id="paren.12"/>, however, limit scalability, and their reliance on first principles hinders significant improvements in forecasting accuracy <xref ref-type="bibr" rid="bib1.bibx112" id="paren.13"/>. Machine learning methods offer promising alternatives, capturing processes not fully covered by biophysical models. However, they typically require high-quality datasets covering large areas and multiple years. Several review articles <xref ref-type="bibr" rid="bib1.bibx15 bib1.bibx44 bib1.bibx56 bib1.bibx113 bib1.bibx8 bib1.bibx74" id="paren.14"/> have highlighted promising performance of machine learning methods, including deep learning, for pre-harvest yield forecasting <xref ref-type="bibr" rid="bib1.bibx95 bib1.bibx123 bib1.bibx48 bib1.bibx62 bib1.bibx76 bib1.bibx25 bib1.bibx59 bib1.bibx55 bib1.bibx78 bib1.bibx116 bib1.bibx61 bib1.bibx83 bib1.bibx24" id="paren.15"/>. However, the data and code used in such studies are not always available, and the diversity in evaluation procedures, metrics, and datasets makes intercomparison and synthesis of results difficult. As a result, the research community is unable to reproduce results and compare the strengths and weaknesses of different methods across crops and regions.</p>
      <p id="d2e642">To better understand the specific strengths and weaknesses of data-driven methods for pre-harvest yield forecasting, and to drive future research progress, well-documented benchmark datasets compiled by domain experts are vital <xref ref-type="bibr" rid="bib1.bibx107 bib1.bibx21 bib1.bibx88 bib1.bibx103" id="paren.16"/>. While benchmark datasets can focus on specific regions or tasks, geographic diversity is a particularly valuable property for agricultural machine learning. Crop yield is influenced by highly variable and region-specific factors such as climate, farming practices, soil properties, and socioeconomic conditions. Datasets that span multiple countries and agro-ecological contexts help ensure that models are robust, transferable, and better equipped to generalize beyond well-studied regions <xref ref-type="bibr" rid="bib1.bibx85 bib1.bibx111" id="paren.17"/>. Including underrepresented or data-scarce regions also promotes research equity and allows the community to address the full spectrum of challenges in global food production <xref ref-type="bibr" rid="bib1.bibx71" id="paren.18"/>. In addition to producing accurate forecasts, models must be reliable in real-world settings for adoption by stakeholders <xref ref-type="bibr" rid="bib1.bibx112" id="paren.19"/>. The evaluation metrics should closely represent the needs of stakeholders and allow a more granular breakdown of model performance <xref ref-type="bibr" rid="bib1.bibx106 bib1.bibx12" id="paren.20"/> – for example, the model's ability to capture yield variability in years with climate extremes <xref ref-type="bibr" rid="bib1.bibx120" id="paren.21"/>. To avoid overestimation of model skill, the evaluation procedure must take into account the specific challenges arising from the use of spatio-temporal data that does not satisfy independent and identically distributed assumptions <xref ref-type="bibr" rid="bib1.bibx67 bib1.bibx102 bib1.bibx45 bib1.bibx86" id="paren.22"/>.</p>
      <p id="d2e668">A few research works have compiled benchmark-like datasets that include components related to crop yield prediction. SustainBench <xref ref-type="bibr" rid="bib1.bibx122" id="paren.23"/> includes a benchmark dataset for crop yield prediction, and targets end-of-season prediction for only one crop (soybean) in three countries (United States, Brazil and Argentina). Another public dataset is CropNet <xref ref-type="bibr" rid="bib1.bibx58" id="paren.24"/>, which only covers the United States. Similarly, there are ongoing efforts to produce a multi-task benchmark dataset which includes yield prediction in the USA as a sub-task <xref ref-type="bibr" rid="bib1.bibx37" id="paren.25"/>. Apart from these, other available data contributions include yield statistics only <xref ref-type="bibr" rid="bib1.bibx54 bib1.bibx82 bib1.bibx89 bib1.bibx20 bib1.bibx2 bib1.bibx3 bib1.bibx11 bib1.bibx14 bib1.bibx40 bib1.bibx66" id="paren.26"/> or sample data published with articles <xref ref-type="bibr" rid="bib1.bibx48 bib1.bibx28 bib1.bibx75 bib1.bibx78" id="paren.27"/> without releasing the full datasets.</p>
      <p id="d2e686">We present CY-Bench, a comprehensive dataset and benchmark for sub-national crop yield forecasting, covering thirty-eight countries for maize and twenty-nine countries for wheat across six continents. Here, sub-national refers to the administrative levels for which official crop statistics are published. Crop yield refers to the end-of-season yield reported in the statistics; and forecasting refers to the production of end-of-season yield estimates with a certain lead time before harvest (e.g., mid-season or 30 d before harvest). Thus, the dataset combines sub-national yield statistics with relevant predictors, such as growing-season weather, remote sensing indicators, and soil properties. The novelty of our contribution lies in the integration, harmonization, and standardization of multiple disparate sources into a single, analysis-ready benchmark. To our knowledge, this is the first publicly available dataset that enables consistent model comparison for sub-national yield forecasting across such a broad set of regions and production systems. Key novel aspects include: (i) facilitating benchmarking across countries rather than single-country datasets, filling a gap recently emphasized in the literature <xref ref-type="bibr" rid="bib1.bibx19 bib1.bibx103" id="paren.28"/>; (ii) harmonization of yield statistics, weather, soil, and remote sensing predictors with consistent spatial and temporal alignment; (iii) broad geographical coverage, explicitly including low- and middle-income countries that are often underrepresented in benchmarks; and (iv) development in collaboration with agricultural experts, climate scientists, and machine learning researchers from the AgML community (<uri>https://www.agml.org/</uri>, last access: 30 May 2026) who guided the selection and alignment of key variables and data sources and contributed to designing the dataset with benchmarking needs in mind. 
CY-Bench thus lowers the barrier to entry for machine learning researchers in this crucial application area, facilitates model intercomparison across diverse agricultural systems, and promotes reproducibility and transparency in agricultural forecasting. By providing an integrated, expert-curated benchmark, our work complements existing datasets that are either crop- or country-specific and enables the community to develop and evaluate forecasting tools that can support decision-makers in food security planning worldwide.</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Dataset construction</title>
      <p id="d2e704">CY-Bench is a benchmark dataset to train and evaluate crop yield forecasting models that produce in-season forecasts with a certain lead time ahead of harvest. The benchmark includes a comprehensive set of predictors that are known to be important drivers of crop yield. Crop yield is determined by the complex interaction of genetics (G), environmental conditions (E), and management decisions (M), commonly referred to as <inline-formula><mml:math id="M1" display="inline"><mml:mrow><mml:mtext>G</mml:mtext><mml:mo>×</mml:mo><mml:mtext>E</mml:mtext><mml:mo>×</mml:mo><mml:mtext>M</mml:mtext></mml:mrow></mml:math></inline-formula>. Genetics (G) includes factors such as genotype, phenotype, and cultivar; environmental conditions (E) encompass both abiotic factors (e.g., climate, soil) and biotic factors (e.g., pests, pollinators); and management decisions (M) involve farm practices like tillage, sowing dates, irrigation, and fertilization <xref ref-type="bibr" rid="bib1.bibx57" id="paren.29"/>. Technological advancements, including genetic improvements, better farm inputs, machinery, and enhanced management practices, have all contributed to increased yields over time <xref ref-type="bibr" rid="bib1.bibx57" id="paren.30"/>. These advancements are often reflected in the yield trend <xref ref-type="bibr" rid="bib1.bibx52" id="paren.31"/>. At the sub-national spatial scale, data on genetic differences (e.g., cultivars) and farm management practices, with the exception of planting and harvest dates, are often not available. Therefore, previous studies of crop yield forecasting also commonly rely on environmental factors, crop calendar information (planting and harvest dates), and yield trend <xref ref-type="bibr" rid="bib1.bibx123 bib1.bibx48 bib1.bibx75" id="paren.32"/>. 
Factors not explicitly captured in CY-Bench but known to influence end-of-season yields are biotic stressors (e.g., pests and diseases), farm management choices (e.g., irrigation, fertilization, cultivar selection), and socioeconomic factors (e.g., market prices, labor availability, and policy changes).</p>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Data sources selection</title>
      <p id="d2e742">In the absence of benchmark datasets like CY-Bench, modeling crop yield involves numerous uncertainties regarding data sources and quality. The data collection and pre-processing protocols of many predictor datasets, cropland or crop type maps, crop calendars and official statistics are important for selecting suitable data sources. Each data source has strengths and limitations related to spatial and temporal resolutions and coverage, sampling methods and gap-filling strategies. After data source selection, predictor data from diverse spatial resolutions needs to be aggregated (to the level of yield statistics), which can lead to information loss. In constructing CY-Bench, we engaged a diverse community of researchers to weigh the benefits and limitations of data sources for each type of data necessary to produce crop yield forecasts. The outcome is a curated set of sources, including alternatives and our justifications for picking one data source over another. The selection process was guided by several principles: (i) global coverage, (ii) public accessibility, (iii) regular updates (except for inherently static datasets), (iv) near real-time availability, and (v) demonstrated relevance for crop growth and development. A summary of these decisions is provided in the dedicated data sections of this paper, while a more comprehensive overview, including specific benefits and limitations of each dataset considered, is available in our online documentation (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>, <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.33"/>). Each selected dataset is further described in accompanying data cards, which provide links to sources, reports, and related publications.</p>
<sec id="Ch1.S2.SS1.SSS1">
  <label>2.1.1</label><title>Weather and soil moisture data</title>
      <p id="d2e758">Weather is a key driver of crop yield variability <xref ref-type="bibr" rid="bib1.bibx30" id="paren.34"/>, as it influences plant growth, development, and physiological processes through factors such as temperature, precipitation, and radiation. Derived weather variables such as vapour pressure deficit and evapotranspiration provide additional information on crop water demand and stress, which can improve yield prediction <xref ref-type="bibr" rid="bib1.bibx60 bib1.bibx104" id="paren.35"/>. Precipitation affects soil moisture availability, and evapotranspiration, which is strongly influenced by vapour pressure deficit, governs water loss and stress risk. Although actual evapotranspiration would be preferred over reference evapotranspiration, the former is crop-dependent and not readily available at a global scale.</p>
      <p id="d2e767">Temperature (<monospace>temp</monospace>), precipitation (<monospace>prec</monospace>), radiation (<monospace>rad</monospace>), reference evapotranspiration (<monospace>ETo</monospace>), and vapor pressure deficit (<monospace>VPD</monospace>) were selected from AgERA5 <xref ref-type="bibr" rid="bib1.bibx9" id="paren.36"/>, which provides daily data at a 0.1° (<inline-formula><mml:math id="M2" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 11 km) spatial resolution. AgERA5 offers agrometeorological indicators from 1979 to the present, derived from ERA5 reanalysis and is tailored for agricultural studies. Its key benefits include high-quality data with near real-time updates (i.e. lag of <inline-formula><mml:math id="M3" display="inline"><mml:mo>∼</mml:mo></mml:math></inline-formula> 2 weeks), comprehensive documentation, and free access via the Copernicus Climate Data Store (CDS, <uri>https://cds.climate.copernicus.eu/#!/home</uri>, last access: 30 May 2026). Other datasets, such as PRISM, GridMET, TerraClimate, MSWEP, and CPC, have limitations including restricted geographic coverage, coarser temporal or spatial resolution, and fewer variables. A detailed comparison of candidate datasets and trade-offs is available on our Zenodo repository (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>; <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.37"/>).</p>
      <p id="d2e812">For soil moisture, we selected surface soil moisture (<monospace>SSM</monospace>) and root-zone soil moisture (<monospace>RSM</monospace>) from the Global Land Data Assimilation System (GLDAS) dataset <xref ref-type="bibr" rid="bib1.bibx87" id="paren.38"/>. This dataset represents gridded and global soil moisture data developed by integrating satellite- and ground-based observational data products, using advanced land surface modeling and data assimilation techniques. The dataset is available from 2003 to present, and can be freely downloaded from the Goddard Earth Sciences Data and Information Services Center (GES DISC; <uri>https://disc.gsfc.nasa.gov/datasets?keywords=GLDAS</uri>, last access: 30 May 2026). It has a temporal resolution of one day, and a spatial resolution of 0.25° (<inline-formula><mml:math id="M4" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 28 km). An alternative dataset is the Global Land Evaporation Amsterdam Model (GLEAM) <xref ref-type="bibr" rid="bib1.bibx69" id="paren.39"/>, but it is typically updated only once a year and is currently available only until December 2023.</p>
</sec>
<sec id="Ch1.S2.SS1.SSS2">
  <label>2.1.2</label><title>Remote sensing data</title>
      <p id="d2e846">Remote sensing indicators of crop biomass and health include vegetation indices, such as the normalized difference vegetation index (<monospace>NDVI</monospace>) and enhanced vegetation index (<monospace>EVI</monospace>), as well as biophysical metrics like the fraction of absorbed photosynthetically active radiation (<monospace>fPAR</monospace>) and leaf area index (<monospace>LAI</monospace>). Sub-national yield forecasting requires long-term time series of these indicators, coupled with frequent satellite revisits to ensure cloud-free imagery. These requirements practically limit options to the coarse-resolution missions MODIS and its successor, VIIRS. While MODIS data can be directly downloaded from NASA Land Processes Distributed Active Archive Center (LP DAAC), the raw vegetation indices and biophysical variables are often of low quality due to issues like cloud cover. These limitations require further screening, gap-filling, and corrections. Furthermore, additional processing, which includes the use of quality flags and the application of temporal smoothing procedures, is time-consuming and complex. These challenges become even more pronounced when processing near-real-time data, which is essential for operational yield forecasting.</p>
      <p id="d2e861">In view of an operational deployment of sub-national yield forecasting, we selected two analysis-ready operational products representing crop biomass and health: <monospace>fPAR</monospace> and <monospace>NDVI</monospace>. <monospace>fPAR</monospace> is provided as dekadal (10 d) data with a spatial resolution of 0.0045° (500 m), utilizing gap-filled and smoothed MODIS and VIIRS datasets. This data is sourced from EC-JRC (<uri>https://agricultural-production-hotspots.ec.europa.eu/data/indicators_fpar/</uri>, last access: 30 May 2026), and its quality is being evaluated in <xref ref-type="bibr" rid="bib1.bibx98" id="text.40"/>. <monospace>NDVI</monospace>, a key indicator of vegetation greenness, is derived from MOD09CMG <xref ref-type="bibr" rid="bib1.bibx115" id="paren.41"/>, available from NASA LP DAAC. The data is prepared as an eight-day composite, selecting the pixel with the highest quality for each composite period. This interval offers a practical compromise: shorter composites tend to be noisier due to clouds, while longer intervals risk missing short-term vegetation dynamics and phenological changes. The data is provided at a spatial resolution of 0.05° (<inline-formula><mml:math id="M5" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 5 km). The quality of this <monospace>NDVI</monospace> product has been evaluated in <xref ref-type="bibr" rid="bib1.bibx64" id="text.42"/>.</p>
      <p id="d2e899">While <monospace>NDVI</monospace> can saturate under dense canopies, alternatives such as <monospace>EVI</monospace> and <monospace>GCVI</monospace> overcome this limitation. We chose to focus on <monospace>fPAR</monospace> and <monospace>NDVI</monospace> because of their extensive use in crop yield studies, their direct link to canopy structure and light interception, and their availability as analysis-ready products. Moreover, <monospace>EVI</monospace> relies on empirical constants for canopy background adjustment, which can introduce calibration challenges across regions <xref ref-type="bibr" rid="bib1.bibx38" id="paren.43"/>.</p>
</sec>
<sec id="Ch1.S2.SS1.SSS3">
  <label>2.1.3</label><title>Soil data</title>
      <p id="d2e932">We selected data from the World Inventory of Soil Emission Potentials (WISE) project <xref ref-type="bibr" rid="bib1.bibx5" id="paren.44"/> for static soil properties. WISE data is constructed using the soil map unit delineations of the broad-scale Harmonized World Soil Database, overlaid by a climate zones map (Köppen-Geiger) as co-variate, and soil property estimates derived from analyses of the ISRIC-WISE soil profile database for the respective mapped “soil/climate” combinations. The dataset has a spatial resolution of 30 arcsec (0.00833° (<inline-formula><mml:math id="M6" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 0.9 km)).</p>
      <p id="d2e945">While SoilGrids <xref ref-type="bibr" rid="bib1.bibx35 bib1.bibx80" id="paren.45"/> is an alternative, WISE was selected due to its suitability for agricultural applications. Specifically, WISE data is considered to be more readily interpretable and provides essential parameters like soil rooting depth and water holding capacity, which are absent in SoilGrids.</p>
</sec>
<sec id="Ch1.S2.SS1.SSS4">
  <label>2.1.4</label><title>Crop mask and crop calendar data</title>
      <p id="d2e960">Crop masks are selected from the European Space Agency WorldCereal (ESA WorldCereal) project (<xref ref-type="bibr" rid="bib1.bibx114" id="altparen.46"/>), which provides an up-to-date and actively maintained source for cropland and crop type maps at a spatial resolution of 0.0045° (500 m). Alternative sources of crop masks include Anomaly Hotspots of Agricultural Production (ASAP) from EC-JRC and IIASA (JRC-IIASA) and Global Best Available Crop Specific Masks (GEOGLAM-BACS) from the Group on Earth Observations Global Agriculture Monitoring (GEOGLAM). We considered ESA WorldCereal to be a better choice than the generic cropland layer from JRC-IIASA because of the availability of crop type maps for maize and wheat (spring and winter cereals). Although GEOGLAM-BACS <xref ref-type="bibr" rid="bib1.bibx7" id="paren.47"/> provides crop type maps for maize and wheat (spring and winter cereals), their spatial resolution (0.05°) is lower compared to ESA WorldCereal (0.0045°).</p>
      <p id="d2e969">Crop calendars also come from the ESA WorldCereal project <xref ref-type="bibr" rid="bib1.bibx29" id="paren.48"/>. ESA WorldCereal crop calendars combine information from existing global crop calendar products, such as GEOGLAM Crop Monitor, the United States Department of Agriculture Foreign Agricultural Service (USDA-FAS), FAO, and EC-JRC's ASAP, into a baseline map and sample them to train a Random Forest algorithm based on climatic and geographic data. They have global coverage and a spatial resolution of 0.5° (<inline-formula><mml:math id="M7" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 55 km). We considered alternative sources, including Food and Agriculture Organization <xref ref-type="bibr" rid="bib1.bibx27" id="paren.49"/>, GGCMI <xref ref-type="bibr" rid="bib1.bibx117 bib1.bibx68" id="paren.50"/>, MIRCA <xref ref-type="bibr" rid="bib1.bibx81" id="paren.51"/>, and SAGE <xref ref-type="bibr" rid="bib1.bibx92" id="paren.52"/>. However, we selected ESA WorldCereal primarily due to its global coverage and alignment with our crop statistics data. A detailed comparison, based on crop types, country coverage, spatial resolution, and data sources, can be found in our Zenodo repository (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>; <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.53"/>).</p>
</sec>
<sec id="Ch1.S2.SS1.SSS5">
  <label>2.1.5</label><title>Crop statistics data</title>
      <p id="d2e1009">Crop yield statistics for sub-national administrative levels are obtained from national statistics offices or regional agencies, depending on their quality and timely availability. In most cases, they come from the national statistics offices. For example, in the United States, they are published by the National Agricultural Statistics Service (NASS) of the United States Department of Agriculture (USDA). For the European Union, member countries report statistics to Eurostat. However, we considered <xref ref-type="bibr" rid="bib1.bibx89" id="text.54"/> a more reliable source than Eurostat, as they follow a harmonization procedure developed by EC-JRC, standardizing crop definitions, administrative boundaries, and reporting practices to produce comparable annual yield time series. For Germany, we selected data from <xref ref-type="bibr" rid="bib1.bibx20" id="text.55"/> instead of <xref ref-type="bibr" rid="bib1.bibx89" id="text.56"/> because of better temporal coverage (1979–2021 vs. 1999–2020), higher spatial resolution for maize (NUTS level 3 vs. level 1) and better quality based on consistency checks (e.g., <inline-formula><mml:math id="M8" display="inline"><mml:mrow><mml:mi mathvariant="normal">yield</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="normal">production</mml:mi><mml:mo>/</mml:mo><mml:mi mathvariant="normal">area</mml:mi></mml:mrow></mml:math></inline-formula>). For Africa, except for Mali, data comes from the USAID's Famine Early Warning Systems Network (FEWS NET) Data Warehouse via the HarvestStat Africa dataset. The data was compiled by FEWS NET and NASA Harvest and harmonized by <xref ref-type="bibr" rid="bib1.bibx54" id="text.57"/> to account for changing administrative boundaries and reporting inconsistencies over time. 
For Mali, we selected the Compagnie Malienne pour le Développement des Textiles (CMDT) dataset <xref ref-type="bibr" rid="bib1.bibx39" id="paren.58"/> that provides higher spatial resolution data at arrondissement-level (administrative level 3). Depending on the country, the term “sub-national” can refer to administrative division 1 (province, state, region), division 2 (district), or division 3 (county, municipality, commune) (Table <xref ref-type="table" rid="T2"/>). When statistics for multiple administrative levels are available, we select the highest resolution.</p>
</sec>
</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>Data preparation</title>
<sec id="Ch1.S2.SS2.SSS1">
  <label>2.2.1</label><title>Crop yield data (targets)</title>
      <p id="d2e1062">The CY-Bench dataset includes crop statistics from thirty-eight countries for maize and twenty-nine countries for wheat (Fig. <xref ref-type="fig" rid="F3"/>). Coverage maps show that CY-Bench has extensive coverage when layered on top of crop type maps from ESA WorldCereal, with notable omissions including Canada, Ukraine and Russia for wheat and Ukraine, Uganda and Tanzania for maize. Data preparation for yield data involved filtering out values that do not meet certain consistency checks, e.g., <inline-formula><mml:math id="M9" display="inline"><mml:mrow><mml:mi mathvariant="normal">yield</mml:mi><mml:mo>≠</mml:mo><mml:mi mathvariant="normal">production</mml:mi><mml:mo>/</mml:mo><mml:mi mathvariant="normal">area</mml:mi></mml:mrow></mml:math></inline-formula>, or zero values. The data sources or publications from which CY-Bench draws the data do additional consistency checks. We refer interested readers to the respective data cards <xref ref-type="bibr" rid="bib1.bibx84" id="paren.59"/> in our Zenodo repository (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>; <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.60"/>), which contain further links to data sources, related reports and publications.</p>
</sec>
<sec id="Ch1.S2.SS2.SSS2">
  <label>2.2.2</label><title>Predictor data</title>
      <p id="d2e1100">CY-Bench predictor data includes static soil properties and time series of weather variables, soil moisture indicators and vegetation indicators (Table <xref ref-type="table" rid="T1"/>). Predictor data and yield statistics often differ in spatial and temporal resolution, requiring further processing to align them effectively. While such aggregation can mask fine-scale variability or temporal dynamics, it can also smooth out noise and improve the stability of predictors <xref ref-type="bibr" rid="bib1.bibx36 bib1.bibx77" id="paren.61"/>. Weather, <monospace>ETo</monospace> and soil moisture data come in daily time steps. <monospace>fPAR</monospace> comes in dekadal time steps, with three values per month (days 1–10, 11–20, 21–31). <monospace>NDVI</monospace> data is available every eight days, with gaps due to cloud cover.</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e1120">Overview of the predictor data, crop mask and crop calendar.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="6">
     <oasis:colspec colnum="1" colname="col1" align="justify" colwidth="2cm"/>
     <oasis:colspec colnum="2" colname="col2" align="justify" colwidth="1.7cm"/>
     <oasis:colspec colnum="3" colname="col3" align="justify" colwidth="1.3cm"/>
     <oasis:colspec colnum="4" colname="col4" align="justify" colwidth="2.5cm"/>
     <oasis:colspec colnum="5" colname="col5" align="justify" colwidth="1.3cm"/>
     <oasis:colspec colnum="6" colname="col6" align="justify" colwidth="6cm"/>
     <oasis:thead>
       <oasis:row>

         <oasis:entry colname="col1" align="left">Category</oasis:entry>

         <oasis:entry rowsep="1" namest="col2" nameend="col3" align="center">Data </oasis:entry>

         <oasis:entry rowsep="1" colname="col4" morerows="1" align="left">Spatial  resolution</oasis:entry>

         <oasis:entry rowsep="1" colname="col5" morerows="1" align="left">Temporal  resolution</oasis:entry>

         <oasis:entry colname="col6" align="left">Source</oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1" align="left"/>

         <oasis:entry colname="col2" align="left">Name</oasis:entry>

         <oasis:entry colname="col3" align="left">Unit</oasis:entry>

         <oasis:entry colname="col6" align="left"/>

       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>

         <oasis:entry colname="col1" align="left">Weather  (time series)</oasis:entry>

         <oasis:entry rowsep="1" colname="col2" align="left">temp  prec  rad  ETo  VPD</oasis:entry>

         <oasis:entry rowsep="1" colname="col3" align="left">°C  mm  J m<sup>−2</sup>  mm  hPa</oasis:entry>

         <oasis:entry rowsep="1" colname="col4" align="left">0.1°  (11 km)</oasis:entry>

         <oasis:entry rowsep="1" colname="col5" align="left">daily</oasis:entry>

         <oasis:entry rowsep="1" colname="col6" align="left">AgERA5 <xref ref-type="bibr" rid="bib1.bibx9" id="paren.62"/></oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col1" align="left"/>

         <oasis:entry rowsep="1" colname="col2" align="left">CWB</oasis:entry>

         <oasis:entry rowsep="1" colname="col3" align="left">mm</oasis:entry>

         <oasis:entry rowsep="1" colname="col4" align="left">0.1° (11 km)</oasis:entry>

         <oasis:entry rowsep="1" colname="col5" align="left">daily</oasis:entry>

         <oasis:entry rowsep="1" colname="col6" align="left">Computed as prec – ETo</oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1" align="left"/>

         <oasis:entry colname="col2" align="left">soil moisture</oasis:entry>

         <oasis:entry colname="col3" align="left">kg m<sup>−2</sup></oasis:entry>

         <oasis:entry colname="col4" align="left">0.25°  (28 km)</oasis:entry>

         <oasis:entry colname="col5" align="left">daily</oasis:entry>

         <oasis:entry colname="col6" align="left">NASA GLDAS <xref ref-type="bibr" rid="bib1.bibx87" id="paren.63"/></oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1" align="left">Vegetation  (time series)</oasis:entry>

         <oasis:entry colname="col2" align="left">fPAR  NDVI</oasis:entry>

         <oasis:entry colname="col3" align="left">%  –</oasis:entry>

         <oasis:entry colname="col4" align="left">0.0045°  (0.5 km)  0.05°  (5.5 km)</oasis:entry>

         <oasis:entry colname="col5" align="left">10 d  8 d</oasis:entry>

         <oasis:entry colname="col6" align="left">JRC <xref ref-type="bibr" rid="bib1.bibx98" id="paren.64"/>  MOD09CMG <xref ref-type="bibr" rid="bib1.bibx115" id="paren.65"/></oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1" align="left">Soil  (static)</oasis:entry>

         <oasis:entry colname="col2" align="left">AWC  bulk density  drainage class</oasis:entry>

         <oasis:entry colname="col3" align="left">cm m<sup>−1</sup>  kg dm<sup>−3</sup>  –</oasis:entry>

         <oasis:entry colname="col4" align="left">0.0083°  (0.9 km)</oasis:entry>

         <oasis:entry colname="col5" align="left">static</oasis:entry>

         <oasis:entry colname="col6" align="left">WISE <xref ref-type="bibr" rid="bib1.bibx5" id="paren.66"/></oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1" align="left">Location  (static)</oasis:entry>

         <oasis:entry colname="col2" align="left">latitude  longitude</oasis:entry>

         <oasis:entry colname="col3" align="left">degrees  degrees</oasis:entry>

         <oasis:entry colname="col4" align="left"/>

         <oasis:entry colname="col5" align="left">static  static</oasis:entry>

         <oasis:entry colname="col6" align="left"/>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col1" align="left">Crop  (auxiliary)</oasis:entry>

         <oasis:entry colname="col2" align="left">crop mask  crop calendar</oasis:entry>

         <oasis:entry colname="col3" align="left">%  day</oasis:entry>

         <oasis:entry colname="col4" align="left">0.0045°  (0.5 km)  0.5°  (55 km)</oasis:entry>

         <oasis:entry colname="col5" align="left">static  static</oasis:entry>

         <oasis:entry colname="col6" align="left">WorldCereal <xref ref-type="bibr" rid="bib1.bibx114 bib1.bibx22" id="paren.67"/>  WorldCereal <xref ref-type="bibr" rid="bib1.bibx29" id="paren.68"/></oasis:entry>

       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e1123">Abbreviations: Temperature (<monospace>temp</monospace>), Precipitation flux (<monospace>prec</monospace>), Solar radiation flux (<monospace>rad</monospace>), Reference evapotranspiration (<monospace>ETo</monospace>), Vapor pressure deficit (<monospace>VPD</monospace>), Climatic water balance (<monospace>CWB</monospace>), Fraction of absorbed photosynthetically active radiation (<monospace>fPAR</monospace>), Normalized difference vegetation index (<monospace>NDVI</monospace>), and available water capacity (<monospace>AWC</monospace>).</p></table-wrap-foot></table-wrap>

<table-wrap id="T2" specific-use="star"><label>Table 2</label><caption><p id="d2e1490">Countries and the administrative levels for which CY-Bench data is provided.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="4">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Group</oasis:entry>
         <oasis:entry namest="col2" nameend="col4" align="center">Country name (country code): Admin level or NUTS Level </oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">EU</oasis:entry>
         <oasis:entry colname="col2">Austria (AT): 2</oasis:entry>
         <oasis:entry colname="col3">Belgium (BE): 2</oasis:entry>
         <oasis:entry colname="col4">Bulgaria (BG): 2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">(<inline-formula><mml:math id="M14" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">23</mml:mn></mml:mrow></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col2">Czechia (CZ): 3</oasis:entry>
         <oasis:entry colname="col3">Germany (DE): 3</oasis:entry>
         <oasis:entry colname="col4">Denmark (DK): 3</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Estonia (EE): 3</oasis:entry>
         <oasis:entry colname="col3">Greece (EL): 3</oasis:entry>
         <oasis:entry colname="col4">Spain (ES): 3</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Finland (FI): 3</oasis:entry>
         <oasis:entry colname="col3">France (FR): 3</oasis:entry>
         <oasis:entry colname="col4">Croatia (HR): 2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Hungary (HU): 3</oasis:entry>
         <oasis:entry colname="col3">Ireland (IE): 2</oasis:entry>
         <oasis:entry colname="col4">Italy (IT): 3</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Lithuania (LT): 3</oasis:entry>
         <oasis:entry colname="col3">Latvia (LV): 3</oasis:entry>
         <oasis:entry colname="col4">Netherlands (NL): 2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Poland (PL): 2</oasis:entry>
         <oasis:entry colname="col3">Portugal (PT): 2</oasis:entry>
         <oasis:entry colname="col4">Romania (RO): 3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Sweden (SE): 3</oasis:entry>
         <oasis:entry colname="col3">Slovakia (SK): 3</oasis:entry>
         <oasis:entry colname="col4"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">FEWSNET</oasis:entry>
         <oasis:entry colname="col2">Angola (AO): 1</oasis:entry>
         <oasis:entry colname="col3">Burkina Faso (BF): 2</oasis:entry>
         <oasis:entry colname="col4">Ethiopia (ET): 2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">(<inline-formula><mml:math id="M15" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">12</mml:mn></mml:mrow></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col2">Lesotho (LS): 1</oasis:entry>
         <oasis:entry colname="col3">Madagascar (MG): 2</oasis:entry>
         <oasis:entry colname="col4">Malawi (MW): 2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Mozambique (MZ): 1</oasis:entry>
         <oasis:entry colname="col3">Niger (NE): 2</oasis:entry>
         <oasis:entry colname="col4">Senegal (SN): 2</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Chad (TD): 1</oasis:entry>
         <oasis:entry colname="col3">South Africa (ZA): 1</oasis:entry>
         <oasis:entry colname="col4">Zambia (ZM): 2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Other countries</oasis:entry>
         <oasis:entry colname="col2">Argentina (AR): department</oasis:entry>
         <oasis:entry colname="col3">Australia (AU): ABARES region (sub-state)</oasis:entry>
         <oasis:entry colname="col4"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">(<inline-formula><mml:math id="M16" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col2">Brazil (BR): municipality</oasis:entry>
         <oasis:entry colname="col3">China (CN): province</oasis:entry>
         <oasis:entry colname="col4"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">India (IN): district</oasis:entry>
         <oasis:entry colname="col3">Mali (ML): municipality</oasis:entry>
         <oasis:entry colname="col4"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Mexico (MX): state</oasis:entry>
         <oasis:entry colname="col3">United States (US): county</oasis:entry>
         <oasis:entry colname="col4"/>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e1786">Predictor data is filtered using crop type maps (or crop masks) from <xref ref-type="bibr" rid="bib1.bibx22" id="text.69"/> which are derived from the ESA WorldCereal project <xref ref-type="bibr" rid="bib1.bibx114" id="paren.70"/>. This step restricts predictor data to pixels in harvested crop areas only. After masking, predictor data is aggregated to match the boundaries and spatial level of the yield data according to the administrative level (Fig. <xref ref-type="fig" rid="F1"/>). The data preparation workflow is implemented in a Python script in our GitHub repository (<uri>https://github.com/WUR-AI/AgML-CY-Bench/tree/main/data_preparation/predictor_data_prep.py</uri>, last access:  30 May 2026; <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.71"/>). We note that all predictor data retain their temporal resolution from the original data source, creating a multi-modal dataset.</p>

      <fig id="F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e1805">Overview of the CY-Bench data preparation process.</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026-f01.jpg"/>

          </fig>


</sec>
<sec id="Ch1.S2.SS2.SSS3">
  <label>2.2.3</label><title>Additional pre-processing for yield forecasting models</title>
      <p id="d2e1824">Here we describe some additional pre-processing steps implemented in our <monospace>cybench</monospace> library that are relevant for building crop yield forecasting models. Predictor data from different sources come with different temporal coverage. Similarly, they include observations for the calendar year, which may not capture the crop season. First, we align time series inputs (weather variables, remote sensing indicators and soil moisture indicators) to the crop season (see Fig. <xref ref-type="fig" rid="F2"/>). We define the boundaries of the crop season as 90 d before the start of season (the spin-up time) to the end of season in a particular calendar year and filter out data outside the boundaries. Therefore, data from the previous year can be included in the current calendar year's crop season and data after the end-of-season date get pushed to the crop season for the next calendar year. Furthermore, data towards the end-of-season are filtered out based on the lead time relative to harvest or end-of-season. Second, we align the input data sources and label data to produce a set of data samples that are complete, i.e. each data sample includes all the relevant predictors for each time step (or static) and a label.</p>

      <fig id="F2" specific-use="star"><label>Figure 2</label><caption><p id="d2e1834">Alignment of time series predictors to the crop season.</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026-f02.png"/>

          </fig>

      <fig id="F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e1845">Coverage of CY-Bench for maize (38 countries) and wheat (29 countries) overlaid on crop type maps from ESA WorldCereal. Coverage is extensive, with notable omissions including Ukraine, Uganda, and Tanzania for maize, and Canada, Ukraine, and Russia for wheat. Some administrative units are covered despite no visible crop mask; this apparent mismatch is caused by thresholding of low-percentage crop mask pixels (e.g., Tasmania contains only a few hectares of wheat).</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026-f03.jpg"/>

          </fig>

      <p id="d2e1855">The time series predictors need further pre-processing during modeling. Certain models require time series data to have the same number of time steps. Therefore, time series inputs are aggregated to dekadal time steps (days 1–10, 11–20, 21–30, and so on), taking the mean of most variables, minimum of minimum temperature, maximum of maximum temperature and the sum of precipitation flux, climatic water balance and solar radiation flux. Where the variable is categorical (such as soil drainage), we take the mode.</p>
      <p id="d2e1858">To further prepare features as tabular data, time series data are aggregated in the temporal dimension to create domain-relevant features. Following expert recommendations, we create monthly averages of minimum daily temperature (<monospace>tmin</monospace>), maximum daily temperature (<monospace>tmax</monospace>), average daily temperature, daily precipitation (<monospace>prec</monospace>), cumulative climatic water balance (<monospace>prec</monospace> <inline-formula><mml:math id="M17" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula> <monospace>ETo</monospace>) and surface soil moisture. Similarly, monthly maximum values are calculated for cumulative growing degree days (<monospace>GDD</monospace>), cumulative precipitation, cumulative <monospace>fPAR</monospace> and cumulative <monospace>NDVI</monospace>. Furthermore, we calculate the number of days in which <monospace>tmin</monospace> is less than 0 °C (“cold days”), days in which <monospace>tmax</monospace> is greater than 35 °C (“hot days”) and days where <monospace>prec</monospace> is less than 1 mm (“dry days”).</p>
</sec>
<sec id="Ch1.S2.SS2.SSS4">
  <label>2.2.4</label><title>Future expansion and data integration</title>
      <p id="d2e1911">CY-Bench currently includes predictor data from 2003 through 2023. Availability of crop statistics varies by country (see Tables <xref ref-type="table" rid="T3"/>, <xref ref-type="table" rid="T4"/>). We share yield and predictor data preparation scripts and notebooks in our Zenodo repository (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>; <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.72"/>) to make the inclusion of new data possible as it becomes available. For example, when crop statistics for new data years become available for specific countries, the data preparation pipeline for agricultural yield data can be run for the crop statistics, and predictor data preparation scripts can be run for predictor inputs. Expanding the database in the future primarily depends on onboarding crop statistics, as the global availability of input predictors ensures that integrating additional crop statistics is the only prerequisite for extending CY-Bench's coverage.</p>

<table-wrap id="T3" specific-use="star"><label>Table 3</label><caption><p id="d2e1928">Data size summary per dataset for EU countries.</p></caption>
  <graphic xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026-t03.png"/>
</table-wrap>

<table-wrap id="T4" specific-use="star"><label>Table 4</label><caption><p id="d2e1939">Data size summary per dataset for other (non-EU) countries.</p></caption>
  <graphic xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026-t04.png"/>
</table-wrap>

</sec>
</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Dataset and task summary</title>
<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Dataset overview</title>
      <p id="d2e1964">CY-Bench covers two main crops, namely maize and wheat. Depending on the country, the crop names can refer to different varieties or seasons of maize and wheat as detailed in our Zenodo repository (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>; <xref ref-type="bibr" rid="bib1.bibx43" id="altparen.73"/>).</p>
</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Task</title>
      <p id="d2e1981">CY-Bench is designed to train and evaluate models for in-season crop yield forecasting of wheat and maize at the sub-national level, covering major and underrepresented crop-growing countries worldwide. Forecasts can be made at multiple time points from start of season (<monospace>sos</monospace>) to end of season (<monospace>eos</monospace>), based on a lead time relative to <monospace>eos</monospace>, e.g., middle-of-season (<inline-formula><mml:math id="M18" display="inline"><mml:mrow><mml:mo>(</mml:mo><mml:mtext mathvariant="monospace">eos</mml:mtext><mml:mo>-</mml:mo><mml:mtext mathvariant="monospace">sos</mml:mtext><mml:mo>)</mml:mo><mml:mo>/</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula>), quarter-of-season (<inline-formula><mml:math id="M19" display="inline"><mml:mrow><mml:mo>(</mml:mo><mml:mtext mathvariant="monospace">eos</mml:mtext><mml:mo>-</mml:mo><mml:mtext mathvariant="monospace">sos</mml:mtext><mml:mo>)</mml:mo><mml:mo>/</mml:mo><mml:mn mathvariant="normal">4</mml:mn></mml:mrow></mml:math></inline-formula>) and <inline-formula><mml:math id="M20" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula>-days before harvest. The exact inference time depends on the crop calendar for the selected crop and region. The quarter-of-season mark often coincides with crops reaching physiological maturity, while the middle-of-season typically represents the transition from vegetative to reproductive growth stages <xref ref-type="bibr" rid="bib1.bibx53 bib1.bibx4" id="paren.74"/>. The reproductive period, which includes flowering and grain filling, is generally the most climate-sensitive phase of the growing season <xref ref-type="bibr" rid="bib1.bibx33" id="paren.75"/>. By contrast, the vegetative phase before mid-season and the senescence phase after grain filling tend to be less sensitive to climate anomalies, although rainfall during the harvest period can significantly impact yield. 
While quarter-of-season forecasts may achieve higher accuracy, middle-of-season forecasts balance accuracy with actionable insights, allowing for management adjustments during the remainder of the growing season – something late forecasts cannot provide.</p>
<sec id="Ch1.S3.SS2.SSSx1" specific-use="unnumbered">
  <title>Formal definition</title>
      <p id="d2e2052">The input data consists of time series inputs (weather, soil moisture, and vegetation indices) and static inputs (soil properties). Let <inline-formula><mml:math id="M21" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">x</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> represent the vector of time series inputs at time <inline-formula><mml:math id="M22" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula>, where <inline-formula><mml:math id="M23" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula> spans from <monospace>sos</monospace> up to the inference point <inline-formula><mml:math id="M24" display="inline"><mml:mi>T</mml:mi></mml:math></inline-formula>. Time series data up to the inference point is represented as <inline-formula><mml:math id="M25" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mtext>sos</mml:mtext><mml:mo>:</mml:mo><mml:mi>T</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="bold-italic">x</mml:mi><mml:mtext>sos</mml:mtext></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi mathvariant="bold-italic">x</mml:mi><mml:mrow><mml:mtext>sos</mml:mtext><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mi mathvariant="normal">…</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mi mathvariant="bold-italic">x</mml:mi><mml:mi>T</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula> and static inputs as <inline-formula><mml:math id="M26" display="inline"><mml:mi mathvariant="bold-italic">z</mml:mi></mml:math></inline-formula>. 
Each training or testing sample <inline-formula><mml:math id="M27" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula> corresponds to a specific region-season pair <inline-formula><mml:math id="M28" display="inline"><mml:mrow><mml:mo>(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>s</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>. For each training sample <inline-formula><mml:math id="M29" display="inline"><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>s</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, the input consists of <inline-formula><mml:math id="M30" display="inline"><mml:mrow><mml:msubsup><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mtext>sos</mml:mtext><mml:mo>:</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M31" display="inline"><mml:mrow><mml:msup><mml:mi mathvariant="bold-italic">z</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. The target is the end-of-season yield <inline-formula><mml:math id="M32" display="inline"><mml:mrow><mml:msup><mml:mi>Y</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for the corresponding region <inline-formula><mml:math id="M33" display="inline"><mml:mi>r</mml:mi></mml:math></inline-formula> and season <inline-formula><mml:math id="M34" display="inline"><mml:mi>s</mml:mi></mml:math></inline-formula>. 
The objective is to learn a mapping function <inline-formula><mml:math id="M35" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula> such that <inline-formula><mml:math id="M36" display="inline"><mml:mrow><mml:msup><mml:mi>Y</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup><mml:mo>=</mml:mo><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msubsup><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mtext>sos</mml:mtext><mml:mo>:</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msup><mml:mi mathvariant="bold-italic">z</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup><mml:mo>;</mml:mo><mml:mi mathvariant="italic">θ</mml:mi><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:msup><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M37" display="inline"><mml:mi mathvariant="italic">θ</mml:mi></mml:math></inline-formula> represents the model parameters, and <inline-formula><mml:math id="M38" display="inline"><mml:mrow><mml:msup><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> is the error term.</p>
      <p id="d2e2362">During testing, the model gets <inline-formula><mml:math id="M39" display="inline"><mml:mrow><mml:msubsup><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mtext>sos</mml:mtext><mml:mo>:</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> from the start of the season (<monospace>sos</monospace>) up to the inference point <inline-formula><mml:math id="M40" display="inline"><mml:mi>T</mml:mi></mml:math></inline-formula> and static inputs <inline-formula><mml:math id="M41" display="inline"><mml:mrow><mml:msup><mml:mi mathvariant="bold-italic">z</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for a new sample <inline-formula><mml:math id="M42" display="inline"><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>,</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>. 
The model then forecasts the end-of-season yield <inline-formula><mml:math id="M43" display="inline"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>Y</mml:mi><mml:mo mathvariant="normal" stretchy="false">^</mml:mo></mml:mover><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup><mml:mo>=</mml:mo><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msubsup><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mtext>sos</mml:mtext><mml:mo>:</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msup><mml:mi mathvariant="bold-italic">z</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup><mml:mo>;</mml:mo><mml:mover accent="true"><mml:mi mathvariant="italic">θ</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M44" display="inline"><mml:mover accent="true"><mml:mi mathvariant="italic">θ</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover></mml:math></inline-formula> are the model parameters learned during training. Model performance is evaluated by comparing yield forecasts <inline-formula><mml:math id="M45" display="inline"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>Y</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> with reported yields <inline-formula><mml:math id="M46" display="inline"><mml:mrow><mml:msup><mml:mi>Y</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>j</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>.</p>
      <p id="d2e2549">Some details that are ignored in the above formulation: <list list-type="bullet"><list-item>
      <p id="d2e2554"><inline-formula><mml:math id="M47" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula> can actually start earlier than <monospace>sos</monospace>, based on spin-up time (e.g., 60 or 90 d before <monospace>sos</monospace>).</p></list-item><list-item>
      <p id="d2e2570">The temporal resolution can be different for time series inputs, i.e. the <inline-formula><mml:math id="M48" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> in <inline-formula><mml:math id="M49" display="inline"><mml:mrow><mml:mtext mathvariant="monospace">sos</mml:mtext><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> represents different time units.</p></list-item></list></p>
</sec>
</sec>
<sec id="Ch1.S3.SS3">
  <label>3.3</label><title>Training, validation and test splits</title>
      <p id="d2e2604">We closely mimic real-world operational settings in the predictor data used, data pre-processing steps and evaluation setup. Specifically, we adopt Leave-One-Year-Out validation (LOYO), which is more appropriate for this type of agricultural problem compared to the random sampling methods commonly used in prior studies <xref ref-type="bibr" rid="bib1.bibx86" id="paren.76"/>, including SustainBench <xref ref-type="bibr" rid="bib1.bibx122" id="paren.77"/>. Yields from neighboring regions in the same year are typically correlated, so random sampling can cause data leakage: information from the same year appears in both training and testing sets. This violates the independent and identically distributed (IID) assumption and produces overly optimistic performance estimates. LOYO avoids this by holding out an entire year, ensuring that correlations within that year are only encountered during evaluation. It also guarantees that extreme yield years are fully represented, rather than being diluted across random splits.</p>
      <p id="d2e2613">Our library computes the following evaluation metrics: normalized root mean squared error (NRMSE; i.e., the root mean squared error normalized by the average yield of the test set), mean absolute percentage error (MAPE), and <inline-formula><mml:math id="M50" display="inline"><mml:mi>R</mml:mi></mml:math></inline-formula>-squared (<inline-formula><mml:math id="M51" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>). These metrics are computed by averaging over all cross-validation test folds (which cover the complete dataset for LOYO) and all admin regions within a country.</p>
</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Discussion</title>
<sec id="Ch1.S4.SS1">
  <label>4.1</label><title>Impact</title>
      <p id="d2e2650">In addition to the relevance for climate change, food security and the United Nations' sustainable development goals, the CY-Bench dataset is relevant to the earth systems science and machine learning research communities due to its comprehensive geographic coverage, capturing diverse agricultural practices and conditions. The inclusion of (indicators derived from) satellite imagery, weather data, and soil properties provides a rich, heterogeneous dataset that presents numerous opportunities for the development of innovative machine learning methods. An inherent challenge of agricultural data, and crop-yield forecasting specifically, is the high level of domain knowledge required in collecting and processing the various data types and defining the task. This analysis-ready dataset is accessible to modelers who do not necessarily have expertise in yield forecasting, lowering the barrier to entry for advanced yield forecasting research and fostering broader participation and innovation in the field.</p>
      <p id="d2e2653">To illustrate the potential of CY-Bench for crop yield prediction, we provide initial benchmarking results using several machine learning models in the accompanying code repository. These results offer a preliminary sense of model performance across regions and model choices and show that the predictive value of features in CY-Bench varies. This highlights the complexity of yield prediction across diverse landscapes and underscores the importance of CY-Bench as a standardized benchmark to study these differences systematically for data-rich and -sparse regions. While these results are only illustrative, a full comparison of methods, including systematic benchmarking and analysis of findings relative to existing datasets will be addressed in a dedicated follow-up study. We emphasize that the purpose of CY-Bench is to support comparative evaluation of modeling approaches under realistic and widely available data constraints, rather than to define an upper bound on achievable yield prediction accuracy.</p>
      <p id="d2e2656">Beyond academic research, this dataset can significantly impact policy-making, agricultural planning, and disaster response by enabling the robust evaluation and development of operational models. Researchers, policymakers, farmers, and agribusinesses can benefit from the insights derived from this dataset, leading to better-informed decisions and improved agricultural outcomes.</p>
</sec>
<sec id="Ch1.S4.SS2">
  <label>4.2</label><title>Limitations</title>
      <p id="d2e2667">We would also like to point out several limitations of CY-Bench that can serve as areas for improvement in future iterations. <list list-type="custom"><list-item><label>1.</label>
      <p id="d2e2672">Some limitations stem from the data sources available in the public domain. <list list-type="custom"><list-item><label>–</label>
      <p id="d2e2677">The predictors do not capture certain factors that influence end-of-season yields, such as pests, diseases, and farm management choices. Similarly, CY-Bench excludes socioeconomic factors such as market prices, labor availability, and policy changes. Some of these omitted factors, like crop varieties and management practices, might exhibit spatial or temporal correlations. Consequently, these factors could be partially captured by incorporating spatial or temporal embeddings within a model. Other factors, such as pests, are less likely to be adequately captured in this way. Including these variables could provide a more holistic understanding of yield fluctuations and help develop more robust models. Nevertheless, the availability of such data on a global scale is typically difficult or often not feasible.</p></list-item><list-item><label>–</label>
      <p id="d2e2681">The crop masks and crop calendars included in CY-Bench are static, i.e. they do not reflect yearly changes. While dynamic, up-to-date masks could improve data quality, the availability of consistent, high-quality, global-scale dynamic masks remains limited – a challenge shared by many yield prediction and benchmarking efforts <xref ref-type="bibr" rid="bib1.bibx46 bib1.bibx122" id="paren.78"/>. Regional, high-resolution products exist (e.g., the USDA Cropland Data Layer; <xref ref-type="bibr" rid="bib1.bibx10" id="altparen.79"/>), but their inclusion would break the harmonization across countries central to CY-Bench. We considered incorporating dynamic global products, such as the recently released MIRCA-OS dataset <xref ref-type="bibr" rid="bib1.bibx46" id="paren.80"/>. However, we prioritized spatial precision over temporal dynamics: MIRCA-OS has a significantly coarser resolution (0.0833°, <inline-formula><mml:math id="M52" display="inline"><mml:mo>∼</mml:mo></mml:math></inline-formula> 10 km) compared to our current mask (0.0045°, <inline-formula><mml:math id="M53" display="inline"><mml:mo>∼</mml:mo></mml:math></inline-formula> 0.5 km), which introduces systematic mixed-pixel bias at sub-national scales. To validate this design choice, we conducted a sensitivity analysis comparing signal variability driven by mask changes versus natural interannual vegetation dynamics (see Appendix A). We found that the variability introduced by mask changes is minor (median relative variability <inline-formula><mml:math id="M54" display="inline"><mml:mo>≈</mml:mo></mml:math></inline-formula> 2 %) compared to the interannual signal variability. For the purpose of regional yield forecasting, the stochastic noise from a static mask was deemed preferable to the systematic bias of coarser dynamic masks. Future iterations of CY-Bench will evaluate high-resolution dynamic masks as they become globally available.</p></list-item><list-item><label>–</label>
      <p id="d2e2716">The crop calendar information included in CY-Bench is limited to start-of-season and end-of-season dates. More detailed phenological stages, such as emergence and flowering date, are not currently represented. Incorporating these intermediate stages could improve expertise-based feature design and generate more predictive inputs for yield forecasting models.</p></list-item><list-item><label>–</label>
      <p id="d2e2720">Government-reported yield statistics can vary in quality across countries due to differences in data collection, aggregation, and reporting accuracy. For a large fraction of the data, we rely on reprocessed and curated statistics from the relevant national agencies. For quality control of these data, we refer to the relevant studies and papers that detail the validation methods applied. Where available, the data card for each country provides a link to these references. In addition, we apply basic quality checks, such as filtering out zero or missing yields and verifying internal consistency (<inline-formula><mml:math id="M55" display="inline"><mml:mrow><mml:mi mathvariant="normal">yield</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="normal">production</mml:mi><mml:mo>/</mml:mo><mml:mi mathvariant="normal">area</mml:mi></mml:mrow></mml:math></inline-formula>). Nevertheless, there is currently no universally accepted protocol for quality control or uncertainty assessment of yield data <xref ref-type="bibr" rid="bib1.bibx19" id="paren.81"/>. As such, CY-Bench does not include formal uncertainty estimates for each observation, though future iterations could incorporate quality indicators based on the source, cropping area, or other metadata.</p></list-item><list-item><label>–</label>
      <p id="d2e2743">Crop yield forecasting models could benefit from incorporating weather forecasts <xref ref-type="bibr" rid="bib1.bibx17" id="paren.82"/>. In our task definition, models cannot access data after the lead time and, therefore, cannot capture conditions that might affect the end-of-season yields after that point. In the real-life setting, forecasters would have access to weather forecasts that may provide useful information. We did not include weather forecasts in CY-Bench because the evidence supporting their usefulness is variable <xref ref-type="bibr" rid="bib1.bibx18" id="paren.83"/> and there are multiple considerations that need to be discussed before including weather forecasts: (a) Observed weather data and forecast data may originate from different sources. (b) Some variables, e.g., <monospace>fPAR</monospace> and <monospace>NDVI</monospace>, have no forecasts. Strategies for addressing these gaps are necessary. (c) Weather forecasts from General Circulation Models (GCMs) typically have coarse spatial resolutions (50–400 km grid sizes) and often contain systematic errors or biases that must be adjusted. Bias correction and downscaling techniques must be applied using observed historical records of weather variables, such as precipitation and temperature, to adjust the climate data and better represent local conditions. (d) Using weather forecasts for yield prediction would also cause error/uncertainty propagation from the weather forecast models leading to an increase in overall uncertainty.</p></list-item></list></p></list-item><list-item><label>2.</label>
      <p id="d2e2759">CY-Bench does not differentiate between irrigated and non-irrigated systems. These systems can exhibit different responses to predictors due to varying water availability, leading to potential inaccuracies in yield forecasts. Our choice was driven by the fact that crop statistics in most countries are rarely reported separately for irrigated and non-irrigated areas.</p></list-item><list-item><label>3.</label>
      <p id="d2e2763">CY-Bench does not provide process-based crop model outputs, which could serve as valuable input features for machine learning models. Additionally, the current feature aggregation uses fixed time steps rather than adapting to crop growth stages. Access to crop model outputs, which contain information on key phenological state changes, could enable the development of more effective, stage-specific features.</p></list-item><list-item><label>4.</label>
      <p id="d2e2767">CY-Bench does not provide raw surface reflectance but includes vegetation indices (i.e. <monospace>NDVI</monospace> – the most frequently-used index for crop yield forecasting; <xref ref-type="bibr" rid="bib1.bibx94" id="altparen.84"/>, and <monospace>fPAR</monospace>) that are strongly correlated with yields <xref ref-type="bibr" rid="bib1.bibx41" id="paren.85"/>. Using high-resolution (10–60 m) satellite images (considering spatial information without aggregating to administrative units as performed in CY-Bench) for crop yield forecasting at the sub-national level would result in a massive data size. In addition, the temporal availability of such data is not very long (e.g., Sentinel available since 2014/2015). Meanwhile, moderate-resolution satellite images have been used to forecast crop yields in the United States (e.g., <xref ref-type="bibr" rid="bib1.bibx123" id="altparen.86"/>), demonstrating an advantage over time series data. Future work could investigate the value of satellite images for sub-national crop yield forecasting at a global level.</p></list-item><list-item><label>5.</label>
      <p id="d2e2786">Finally, the LOYO method of evaluation is used due to small data sizes in many countries. This approach assumes that all years are independent, which may be too strong an assumption if consecutive years have correlated environmental and climatic conditions. Also, management strategies might affect multiple seasons; for example, there is evidence of the impact of crop rotation from a previous season on yields <xref ref-type="bibr" rid="bib1.bibx51" id="paren.87"/>. While LOYO is a practical compromise for smaller datasets (allowing maximum use of available training data while ensuring each year is evaluated), regions with larger datasets could benefit from forward sliding (rolling-window) validation, which better mimics operational forecasting.</p></list-item></list></p>
</sec>
<sec id="Ch1.S4.SS3">
  <label>4.3</label><title>Advancing earth system modeling</title>
      <p id="d2e2800">We noted a distinct lack of benchmark datasets for agricultural yield forecasting. Still, many recent developments in the related field of crop type mapping using satellite data <xref ref-type="bibr" rid="bib1.bibx90 bib1.bibx109 bib1.bibx122 bib1.bibx49" id="paren.88"/> are leading to exciting progress in the development of methods for extracting meaningful patterns from time series of earth observation data <xref ref-type="bibr" rid="bib1.bibx91 bib1.bibx90 bib1.bibx79 bib1.bibx93" id="paren.89"/>. Similarly, some studies have shown improved model performance for land cover classification, crop mapping and agricultural yield forecasting using meta-learning and multitask learning <xref ref-type="bibr" rid="bib1.bibx110 bib1.bibx108 bib1.bibx47" id="paren.90"/>. CY-Bench includes time series of crop productivity or vegetation health indicators from earth observation as predictors, and can therefore be combined with existing crop mapping benchmark datasets to explore such approaches.</p>
      <p id="d2e2812">Apart from the downstream task of pre-harvest yield forecasting, CY-Bench enables explorations in transfer learning, domain adaptation, and representation learning to assess whether models can generalize well across diverse geographic and climatic conditions. We envision at least four directions for future research. First, transfer learning methods can be explored to improve model generalization ability when training on data-rich regions and deploying to data-sparse regions <xref ref-type="bibr" rid="bib1.bibx50 bib1.bibx16 bib1.bibx73" id="paren.91"/>. Second, self-supervised learning could be used to harness the vast amounts of unlabeled agricultural data available <xref ref-type="bibr" rid="bib1.bibx119 bib1.bibx121" id="paren.92"/>. By training models to recognize patterns and structures within this data, we can build robust representations that capture essential features of agricultural systems. These representations can then be fine-tuned using the labeled datasets in CY-Bench specific to each country or crop. For instance, a self-supervised model trained on satellite images and environmental data can later be fine-tuned to predict specific crop yields in various regions, making it a powerful tool for global agricultural analysis. Third, another important area is to explore the stability of model predictions against natural and human interventions. This involves understanding how factors like extreme weather events, policy changes, or management practices impact yield forecasts. Causal invariance learning focuses on identifying and utilizing stable variables across different environments to ensure robustness and generalization <xref ref-type="bibr" rid="bib1.bibx70 bib1.bibx72" id="paren.93"/>. For example, soil quality and basic climatic factors like temperature and precipitation may have stable relationships with crop yields. 
By recognizing variables that consistently impact crop yields regardless of geographic or climatic differences, it may be possible to build models that are resilient to distributional shifts and perform reliably across diverse conditions.</p>
</sec>
</sec>
<sec id="Ch1.S5">
  <label>5</label><title>Code and data availability</title>
      <p id="d2e2834">The complete code base encompassing data pre-processing, tools for model construction, training, evaluation, and data/metric visualization routines is available through our publicly accessible Zenodo repository: <ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link> <xref ref-type="bibr" rid="bib1.bibx43" id="paren.94"/>. A summarizing overview can be found on <uri>https://cybench.agml.org/</uri> (last access: 30 May 2026). We additionally provide a Python package <monospace>cybench</monospace> that can be installed via the repository to load the dataset and run CY-Bench. The dataset is available in Zenodo at <ext-link xlink:href="https://doi.org/10.5281/zenodo.11502142" ext-link-type="DOI">10.5281/zenodo.11502142</ext-link> <xref ref-type="bibr" rid="bib1.bibx42" id="paren.95"/> and is comprehensively documented using the framework of Data Cards. Each individual dataset subset is accompanied by a dedicated Data Card located within the data_preparation (<ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>) directory of our repository <xref ref-type="bibr" rid="bib1.bibx43" id="paren.96"/>. The CY-Bench dataset and the Python library are licensed under EUPL-1.2 (<uri>https://joinup.ec.europa.eu/collection/eupl/eupl-text-eupl-12</uri>, last access: 30 May 2026), which is compatible with all of the licenses for the datasets included.</p>
</sec>
<sec id="Ch1.S6" sec-type="conclusions">
  <label>6</label><title>Conclusions</title>
      <p id="d2e2873">Innovative, data-driven approaches are crucial for enhancing the resilience of food systems to climate change and extreme events, which is essential for achieving the United Nations' Sustainable Development Goal 2 of Zero Hunger <xref ref-type="bibr" rid="bib1.bibx97" id="paren.97"/>. By providing a well-curated dataset designed for the consistent development and evaluation of large-scale crop yield predictions, CY-Bench is a step forward in improving the accuracy of yield forecasting. Curated by an interdisciplinary group of experts in agronomy, food security, climate science and agriculture, this dataset can facilitate increased collaboration between fields and ultimately help to produce reliable crop yield forecasts to support the decisions of farmers, policymakers and commodity traders worldwide. In summary, with CY-Bench we aim to contribute to advancing earth system sciences by providing a critical resource for modeling the effects of climate change, extreme events, and environmental variability on crop yields, while also supporting machine learning research in time series forecasting, transfer learning, and domain adaptation techniques.</p>
</sec>

      
      </body>
    <back><app-group>

<app id="App1.Ch1.S1">
  <label>Appendix A</label><title>Sensitivity Analysis of Static vs. Dynamic Crop Masks</title>
      <p id="d2e2890">A primary challenge in global-scale benchmarking is the trade-off between spatial resolution and temporal consistency in crop masks. CY-Bench utilizes a static, high-resolution (<inline-formula><mml:math id="M56" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 0.5 km) crop mask. To assess the potential error introduced by neglecting year-to-year changes in cropped area (e.g., due to rotation or fallowing), we performed a sensitivity analysis using the dynamic, but coarser (<inline-formula><mml:math id="M57" display="inline"><mml:mo lspace="0mm">∼</mml:mo></mml:math></inline-formula> 10 km), MIRCA-OS dataset <xref ref-type="bibr" rid="bib1.bibx46" id="paren.98"/>.</p>
      <p id="d2e2910">We isolated the “mask effect” by calculating the regional aggregate of a vegetation indicator (<monospace>fPAR</monospace>) in two ways for over 12 000 administrative regions: <list list-type="order"><list-item>
      <p id="d2e2918">Signal Variance: The crop mask is held constant, while the vegetation signal varies according to its observed interannual dynamics.</p></list-item><list-item>
      <p id="d2e2922">Mask Variance: The vegetation signal is held constant at its climatological mean, isolating the variability driven solely by annual changes in the crop mask (using MIRCA-OS 2000–2015).</p></list-item></list></p>
      <p id="d2e2925">The analysis revealed that the variability driven by mask changes is significantly lower than the natural interannual variability of the crop signal. Specifically, the median relative variability (defined as the ratio of mask-induced standard deviation to signal-induced standard deviation) was approximately 2 % across all regions.</p>
      <p id="d2e2928">These results confirm that at the sub-national aggregation level used in CY-Bench, the error introduced by using a static mask is negligible relative to the signal of interest. Furthermore, the use of a static mask avoids the mixed-pixel bias inherent in coarser dynamic products.</p><fig id="FA1"><label>Figure A1</label><caption><p id="d2e2934">Comparison of variability driven by natural interannual signal fluctuations versus crop mask evolution. The colored lines represent the indicator trajectories if only the crop mask changed (using MIRCA-OS dynamic masks), while the blue envelope represents the interannual variability of the signal with a static mask. The vertical spread of the mask effect is minor compared to the natural interannual variation of the signal, showing that the error introduced by using a static mask is negligible relative to the signal of interest.</p></caption>
        
        <graphic xlink:href="https://essd.copernicus.org/articles/18/3997/2026/essd-18-3997-2026-f04.png"/>

      </fig>

</app>
  </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e2949">MK: Project administration, Software, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2952">DP: Conceptualization, Methodology, Project administration, Investigation, Software, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2955">SOA: Data curation, Software, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2958">HB: Investigation, Software, Visualization, Writing – review &amp; editing.</p>

      <p id="d2e2961">RVB: Software, Validation, Writing – review &amp; editing.</p>

      <p id="d2e2965">AP: Software, Validation, Writing – review &amp; editing.</p>

      <p id="d2e2968">PP: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2971">AS: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e2974">WA: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2977">MVB: Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2980">AC: Validation, Writing – review &amp; editing.</p>

      <p id="d2e2984">OE: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e2987">RH: Data curation, Project administration, Validation, Writing – review &amp; editing.</p>

      <p id="d2e2990">RL: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e2993">DL: Data curation, Validation, Writing – review &amp; editing.</p>
    

      <p id="d2e2998">IL: Data curation.</p>

      <p id="d2e3003">DM: Software, Validation.</p>

      <p id="d2e3006">MM: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3009">JMM: Data curation, Writing – review &amp; editing.</p>

      <p id="d2e3012">SM: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3015">JR: Data curation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3018">ACR: Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3022">RS: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3025">GS: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e3028">VS: Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3031">RDSNJ: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e3034">AKS: Data curation, Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3037">RS: Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3041">LS: Validation, Writing – original draft preparation, Writing – review &amp; editing.</p>

      <p id="d2e3044">PV: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e3047">ADW: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e3050">MZ: Data curation, Validation, Writing – review &amp; editing.</p>

      <p id="d2e3053">INA: Funding acquisition, Supervision, Validation, Writing – review &amp; editing.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e3059">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e3065">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. The authors bear the ultimate responsibility for providing appropriate place names. Views expressed in the text are those of the authors and do not necessarily reflect the views of the publisher.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e3071">CY-Bench benefited from many helpful discussions with the participants of AgML (<uri>https://www.agml.org</uri>, last access: 30 May 2026), the Machine Learning team of the Agricultural Model Intercomparison and Improvement Project (AgMIP, <uri>http://www.agmip.org</uri>, last access: 30 May 2026).</p><p id="d2e3079">We would also like to acknowledge the contributions of Marc Russwurm, Afef Marzougui, Hendrik Boogaard, Marijn van der Velde, Steven Hoek, Filip Szabo, Francesco Collivignarelli, Xiaomao Lin, Toshi Iizumi, Peng Fu, Prakriti Bista, Paresh Shirsath, Soora Naresh Kumar, Sibiri Traore and Javier Garcia Navarro in the design and implementation of the benchmark and preparation of the manuscript.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e3084">This work was partially supported by the WUR Research Investment Theme on Data-Driven Discoveries in a Changing Climate, and the Digital Europe Programme under Grant agreement AgrifoodTEF – Test and Experiment Facilities for the Agri-Food Domain (ID 101100622).</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e3090">This paper was edited by Yun Yang and reviewed by two anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bibx1"><label>Ambikapathi et al.(2022)Ambikapathi, Schneider, Davis, Herrero, Winters, and Fanzo</label><mixed-citation>Ambikapathi, R., Schneider, K. R., Davis, B., Herrero, M., Winters, P., and Fanzo, J. C.: Global food systems transitions have enabled affordable diets but had less favourable outcomes for nutrition, environmental health, inclusion and equity, Nature Food, 3, 764–779, <ext-link xlink:href="https://doi.org/10.1038/s43016-022-00588-7" ext-link-type="DOI">10.1038/s43016-022-00588-7</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx2"><label>Argentina(2016)</label><mixed-citation>Argentina: Ministerio de Agricultura, Ganadería y Pesca. “Estimaciones Agrícolas”, <uri>https://datosestimaciones.magyp.gob.ar/reportes.php?reporte=Estimaciones</uri> (last access: 29 April 2016), 2016.</mixed-citation></ref>
      <ref id="bib1.bibx3"><label>Australia(2024)</label><mixed-citation>Australia: ABARES. Australian Bureau of Agricultural and Resource Economics and Sciences Farm Data Portal, <uri>https://www.agriculture.gov.au/abares/data/farm-data-portal#data-download</uri> (last access: 5 March 2024), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx4"><label>Basso and Liu(2019)</label><mixed-citation>Basso, B. and Liu, L.: Seasonal crop yield forecast: Methods, applications, and accuracies, Adv. Agron.,  154, 201–255, <ext-link xlink:href="https://doi.org/10.1016/bs.agron.2018.11.002" ext-link-type="DOI">10.1016/bs.agron.2018.11.002</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx5"><label>Batjes(2016)</label><mixed-citation>Batjes, N. H.: Harmonized soil property values for broad-scale modelling (WISE30sec) with estimates of global soil carbon stocks, Geoderma, 269, 61–68, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2016.01.034" ext-link-type="DOI">10.1016/j.geoderma.2016.01.034</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx6"><label>Becker-Reshef et al.(2020)Becker-Reshef, Justice, Barker, Humber, Rembold, Bonifacio, Zappacosta, Budde, Magadzire, Shitote, Pound, Constantino, Nakalembe, Mwangi, Sobue, Newby, Whitcraft, Jarvis, and Verdin</label><mixed-citation>Becker-Reshef, I., Justice, C., Barker, B., Humber, M., Rembold, F., Bonifacio, R., Zappacosta, M., Budde, M., Magadzire, T., Shitote, C., Pound, J., Constantino, A., Nakalembe, C., Mwangi, K., Sobue, S., Newby, T., Whitcraft, A., Jarvis, I., and Verdin, J.: Strengthening agricultural decisions in countries at risk of food insecurity: The GEOGLAM Crop Monitor for Early Warning, Remote Sens. Environ., 237, 111553, <ext-link xlink:href="https://doi.org/10.1016/j.rse.2019.111553" ext-link-type="DOI">10.1016/j.rse.2019.111553</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx7"><label>Becker-Reshef et al.(2023)Becker-Reshef, Barker, Whitcraft, Oliva, Mobley, Justice, and Sahajpal</label><mixed-citation>Becker-Reshef, I., Barker, B., Whitcraft, A., Oliva, P., Mobley, K., Justice, C., and Sahajpal, R.: Crop type maps for operational global agricultural monitoring, Sci. Data, 10, 172, <ext-link xlink:href="https://doi.org/10.1038/s41597-023-02047-9" ext-link-type="DOI">10.1038/s41597-023-02047-9</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx8"><label>Benos et al.(2021)Benos, Tagarakis, Dolias, Berruto, Kateris, and Bochtis</label><mixed-citation>Benos, L., Tagarakis, A. C., Dolias, G., Berruto, R., Kateris, D., and Bochtis, D.: Machine learning in agriculture: A comprehensive updated review, Sensors, 21, 3758, <ext-link xlink:href="https://doi.org/10.3390/s21113758" ext-link-type="DOI">10.3390/s21113758</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx9"><label>Boogaard et al.(2022)Boogaard, Schubert, De Wit, Lazebnik, Hutjes, and Van der Grijn</label><mixed-citation>Boogaard, H., Schubert, J., De Wit, A., Lazebnik, J., Hutjes, R., and Van der Grijn, G.: Agrometeorological indicators from 1979 to present derived from reanalysis, Climate Data Store – Copernicus Climate Change Service, <ext-link xlink:href="https://doi.org/10.24381/cds.6c68c9bb" ext-link-type="DOI">10.24381/cds.6c68c9bb</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx10"><label>Boryan et al.(2011)Boryan, Yang, Mueller, and Craig</label><mixed-citation> Boryan, C., Yang, Z., Mueller, R., and Craig, M.: Monitoring US agriculture: the US department of agriculture, national agricultural statistics service, cropland data layer program, Geocarto Int., 26, 341–358, 2011.</mixed-citation></ref>
      <ref id="bib1.bibx11"><label>Brazil(2022)</label><mixed-citation>Brazil: IBGE SIDRA. “Tabela 1612: Área plantada, área colhida, quantidade produzida, rendimento médio e valor da produção das lavouras temporárias”, <uri>https://sidra.ibge.gov.br/tabela/1612</uri> (last access: 6 February 2024), 2022.</mixed-citation></ref>
      <ref id="bib1.bibx12"><label>Burnell et al.(2023)Burnell, Schellaert, Burden, Ullman, Martinez-Plumed, Tenenbaum, Rutar, Cheke, Sohl-Dickstein, Mitchell, Kiela, Shanahan, Voorhees, Cohn, Leibo, and Hernandez-Orallo</label><mixed-citation>Burnell, R., Schellaert, W., Burden, J., Ullman, T. D., Martinez-Plumed, F., Tenenbaum, J. B., Rutar, D., Cheke, L. G., Sohl-Dickstein, J., Mitchell, M., Kiela, D., Shanahan, M., Voorhees, E. M., Cohn, A. G., Leibo, J. Z., and Hernandez-Orallo, J.: Rethink reporting of evaluation results in AI, Science, 380, 136–138, <ext-link xlink:href="https://doi.org/10.1126/science.adf6369" ext-link-type="DOI">10.1126/science.adf6369</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx13"><label>Chen and Villoria(2022)</label><mixed-citation>Chen, B. and Villoria, N. B.: Foreign yield shocks and domestic price variability: the case of maize in developing countries, Environ. Res. Lett., 17, 124044, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/aca7d5" ext-link-type="DOI">10.1088/1748-9326/aca7d5</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx14"><label>China(2024)</label><mixed-citation>China: National Bureau of Statistics of China, National Data Portal, <uri>https://data.stats.gov.cn</uri> (last access: 18 February 2024), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx15"><label>Chlingaryan et al.(2018)Chlingaryan, Sukkarieh, and Whelan</label><mixed-citation>Chlingaryan, A., Sukkarieh, S., and Whelan, B.: Machine learning approaches for crop yield prediction and nitrogen status estimation in precision agriculture: A review, Comput. Electron. Agr., 151, 61–69, <ext-link xlink:href="https://doi.org/10.1016/j.compag.2018.05.012" ext-link-type="DOI">10.1016/j.compag.2018.05.012</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx16"><label>Coulibaly et al.(2019)Coulibaly, Kamsu-Foguem, Kamissoko, and Traore</label><mixed-citation> Coulibaly, S., Kamsu-Foguem, B., Kamissoko, D., and Traore, D.: Deep neural networks with transfer learning in millet crop images, Comput. Ind., 108, 115–120, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx17"><label>Cunha et al.(2018)Cunha, Silva, and Netto</label><mixed-citation>Cunha, R. L., Silva, B., and Netto, M. A.: A scalable machine learning system  for pre-season agriculture yield forecast, in: 2018 IEEE 14th international  conference on e-science (e-Science), IEEE, 423–430, <ext-link xlink:href="https://doi.org/10.1109/eScience.2018.00131" ext-link-type="DOI">10.1109/eScience.2018.00131</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx18"><label>Darbyshire et al.(2020)Darbyshire, Crean, Cashen, Anwar, Broadfoot, Simpson, Cobon, Pudmenzky, Kouadio, and Kodur</label><mixed-citation>Darbyshire, R., Crean, J., Cashen, M., Anwar, M. R., Broadfoot, K. M., Simpson, M., Cobon, D. H., Pudmenzky, C., Kouadio, L., and Kodur, S.: Insights into the value of seasonal climate forecasts to agriculture, Aust. J. Agr. Resour. Ec., 64, 1034–1058, <ext-link xlink:href="https://doi.org/10.1111/1467-8489.12389" ext-link-type="DOI">10.1111/1467-8489.12389</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx19"><label>Davis et al.(2025)</label><mixed-citation>Davis, K. F., Anderson, W., Ehrmann, S., Flach, R., Meyer, C., Proctor, J.,  Ray, D. K., You, L., Foley, M., Kerdiles, H., Hultgren, A., Huybers, P., Kebede, E., Meroni, M., Park, C., and Lee, D.: HarvestStat: A global  effort towards open and standardized sub-national agricultural data,  Environ. Res. Lett., 20, 052001, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/adcb54" ext-link-type="DOI">10.1088/1748-9326/adcb54</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx20"><label>Duden et al.(2024)Duden, Nacke, and Offermann</label><mixed-citation>Duden, C., Nacke, C., and Offermann, F.: German yield and area data for 11 crops from 1979 to 2021 at a harmonized spatial resolution of 397 districts, Sci. Data, 11, <ext-link xlink:href="https://doi.org/10.1038/s41597-024-02951-8" ext-link-type="DOI">10.1038/s41597-024-02951-8</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx21"><label>Dueben et al.(2022)Dueben, Schultz, Chantry, Gagne, Hall, and McGovern</label><mixed-citation>Dueben, P. D., Schultz, M. G., Chantry, M., Gagne, D. J., Hall, D. M., and McGovern, A.: Challenges and Benchmark Datasets for Machine Learning in the Atmospheric Sciences: Definition, Status, and Outlook, Artificial Intelligence for the Earth Systems, 1, <ext-link xlink:href="https://doi.org/10.1175/AIES-D-21-0002.1" ext-link-type="DOI">10.1175/AIES-D-21-0002.1</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx22"><label>EC-JRC(2024)</label><mixed-citation> EC-JRC: Elaboration of Van Tricht et al, 2023, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx23"><label>Ennaji et al.(2023)Ennaji, Vergutz, and El Allali</label><mixed-citation>Ennaji, O., Vergutz, L., and El Allali, A.: Machine learning in nutrient management: A review, Artificial Intelligence in Agriculture, 9, 1–11, <ext-link xlink:href="https://doi.org/10.1016/j.aiia.2023.06.001" ext-link-type="DOI">10.1016/j.aiia.2023.06.001</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx24"><label>Ennaji et al.(2024)Ennaji, Baha, Vergutz, and El Allali</label><mixed-citation>Ennaji, O., Baha, S., Vergutz, L., and El Allali, A.: Gradient boosting for yield prediction of elite maize hybrid ZhengDan 958, PLoS One, 19, e0315493, <ext-link xlink:href="https://doi.org/10.1371/journal.pone.0315493" ext-link-type="DOI">10.1371/journal.pone.0315493</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx25"><label>Fan et al.(2022)Fan, Bai, Li, Ortiz-Bobea, and Gomes</label><mixed-citation>Fan, J., Bai, J., Li, Z., Ortiz-Bobea, A., and Gomes, C.: A GNN-RNN Approach for Harnessing Geospatial and Temporal Information: Application to Crop Yield Prediction, Proceedings of the AAAI Conference on Artificial Intelligence, 36, 11873–11881, <ext-link xlink:href="https://doi.org/10.1609/aaai.v36i11.21444" ext-link-type="DOI">10.1609/aaai.v36i11.21444</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx26"><label>Fanzo(2024)</label><mixed-citation>Fanzo, J.: Kicking around in the wreck, PLOS Climate, 3, e0000401, <ext-link xlink:href="https://doi.org/10.1371/journal.pclm.0000401" ext-link-type="DOI">10.1371/journal.pclm.0000401</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx27"><label>FAO(2025)</label><mixed-citation>FAO: Crop Calendar Food and Agriculture Organization of the United Nations, <uri>https://cropcalendar.apps.fao.org</uri> (last access: 11 February 2025), 2025.</mixed-citation></ref>
      <ref id="bib1.bibx28"><label>Fernandez-Beltran et al.(2021)Fernandez-Beltran, Baidar, Kang, and Pla</label><mixed-citation>Fernandez-Beltran, R., Baidar, T., Kang, J., and Pla, F.: Rice-Yield Prediction with Multi-Temporal Sentinel-2 Data and 3D CNN: A Case Study in Nepal, Remote Sensing, 13, 1391, <ext-link xlink:href="https://doi.org/10.3390/rs13071391" ext-link-type="DOI">10.3390/rs13071391</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx29"><label>Franch et al.(2022)</label><mixed-citation>Franch, B., Cintas, J., Becker-Reshef, I., Sanchez-Torres, M. J., Roger, J.,  Skakun, S., Sobrino, J. A., Van Tricht, K., Degerickx, J., Gilliams, S.,  Koetz, B., Szantoi, Z., and Whitcraft, A.: Global crop calendars of maize and wheat in the framework of the WorldCereal project, GISci. Remote Sens., 59, 885–913, <ext-link xlink:href="https://doi.org/10.1080/15481603.2022.2079273" ext-link-type="DOI">10.1080/15481603.2022.2079273</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx30"><label>Frieler et al.(2017)</label><mixed-citation>Frieler, K., Schauberger, B., Arneth, A., Balkovič, J.,  Chryssanthacopoulos, J., Deryng, D., Elliott, J., Folberth, C., Khabarov, N.,  Müller, C., Olin, S., Pugh, T. A. M., Schaphoff, S., Schewe, J., Schmid, E., Warszawski, L., and Levermann, A.: Understanding the weather signal in national crop-yield variability, Earth's Future, 5, 605–616, <ext-link xlink:href="https://doi.org/10.1002/2016EF000525" ext-link-type="DOI">10.1002/2016EF000525</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx31"><label>Gavasso-Rita et al.(2023)Gavasso-Rita, Papalexiou, Li, Elshorbagy, Li, and Schuster-Wallace</label><mixed-citation>Gavasso-Rita, Y. L., Papalexiou, S. M., Li, Y., Elshorbagy, A., Li, Z., and Schuster-Wallace, C.: Crop models and their use in assessing crop production and food security: A review, Food and Energy Security, 13, e503, <ext-link xlink:href="https://doi.org/10.1002/fes3.503" ext-link-type="DOI">10.1002/fes3.503</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx32"><label>Good and Irwin(2003)</label><mixed-citation>Good, D. L. and Irwin, S. H.: Understanding USDA corn and soybean production  forecasts: An overview of methods, performance and market impacts, <ext-link xlink:href="https://doi.org/10.22004/ag.econ.37496" ext-link-type="DOI">10.22004/ag.econ.37496</ext-link>, 2003.</mixed-citation></ref>
      <ref id="bib1.bibx33"><label>Hatfield and Prueger(2015)</label><mixed-citation> Hatfield, J. L. and Prueger, J. H.: Temperature extremes: Effect on plant growth and development, Weather and Climate Extremes, 10, 4–10, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx34"><label>He et al.(2017)He, Wang, Wang, and Robertson</label><mixed-citation>He, D., Wang, E., Wang, J., and Robertson, M.: Data requirement for effective calibration of process-based crop models, Agr. Forest Meteorol., 234–235, 136–148, <ext-link xlink:href="https://doi.org/10.1016/j.agrformet.2016.12.015" ext-link-type="DOI">10.1016/j.agrformet.2016.12.015</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx35"><label>Hengl et al.(2017)</label><mixed-citation>Hengl, T., Mendes de Jesus, J., Heuvelink, G. B., Ruiperez Gonzalez, M., Kilibarda, M., Blagotić, A., Shangguan, W., Wright, M. N., Geng, X., Bauer-Marschallinger, B., Guevara, M. A., Vargas, R., MacMillan, R. A., Batjes, N. H., Leenaars, J. G. B., Ribeiro, E., Wheeler, I., Mantel, S., and Kempen, B.: SoilGrids250m: Global gridded soil information based on machine learning, PLoS One, 12, e0169748, <ext-link xlink:href="https://doi.org/10.1371/journal.pone.0169748" ext-link-type="DOI">10.1371/journal.pone.0169748</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx36"><label>Hoffmann et al.(2016)</label><mixed-citation>Hoffmann, H., Zhao, G., Asseng, S., Bindi, M., Biernath, C., Constantin, J.,  Coucheney, E., Dechow, R., Doro, L., Eckersten, H., Gaiser, T., Grosz, B., Heinlein, F., Kassie, B. T., Kersebaum, K.-C., Klein, C., Kuhnert, M., Lewan, E., Moriondo, M., Nendel, C., Priesack, E., Raynal, H., Roggero, P. P., Rötter, R. P., Siebert, S., Specka, X., Tao, F., Teixeira, E., Trombi, G., Wallach, D., Weihermüller, L., Yeluripati, J., and Ewert, F.: Impact of spatial soil and climate input data aggregation on regional yield simulations, PLoS One, 11, e0151782, <ext-link xlink:href="https://doi.org/10.1371/journal.pone.0151782" ext-link-type="DOI">10.1371/journal.pone.0151782</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx37"><label>Höhl et al.(2023)Höhl, Ofori-Ampofo, Obadic, Fernández-Torres, Salih Kuzu, and Zhu</label><mixed-citation>Höhl, A., Ofori-Ampofo, S., Obadic, I., Fernández-Torres, M.-Á., Salih Kuzu, R., and Zhu, X.: USCC: A Benchmark Dataset for Crop Yield Prediction under Climate Extremes, EGU General Assembly 2023, Vienna, Austria, 23–28 Apr 2023, EGU23-15540, <ext-link xlink:href="https://doi.org/10.5194/egusphere-egu23-15540" ext-link-type="DOI">10.5194/egusphere-egu23-15540</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx38"><label>Huete et al.(2002)Huete, Didan, Miura, Rodriguez, Gao, and Ferreira</label><mixed-citation> Huete, A., Didan, K., Miura, T., Rodriguez, E. P., Gao, X., and Ferreira, L. G.: Overview of the radiometric and biophysical performance of the MODIS vegetation indices, Remote Sens. Environ., 83, 195–213, 2002.</mixed-citation></ref>
      <ref id="bib1.bibx39"><label>ICRISAT Mali(2018)</label><mixed-citation>ICRISAT Mali: Compagnie Malienne pour le Developpement des Textiles (CMDT)  Monitoring Operational Maize Yield Statistics, <uri>http://data.icrisat.org/dataverse/</uri> (last access: 30 May 2026), 2018.</mixed-citation></ref>
      <ref id="bib1.bibx40"><label>India(2024)</label><mixed-citation>India: ICRISAT. District Level Database, <uri>http://data.icrisat.org/dld/src/crops.html</uri> (last access:  9 February 2024), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx41"><label>Johnson(2016)</label><mixed-citation>Johnson, D. M.: A comprehensive assessment of the correlations between field crop yields and commonly used MODIS products, Int. J. Appl. Earth Obs., 52, 65–81, <ext-link xlink:href="https://doi.org/10.1016/j.jag.2016.05.010" ext-link-type="DOI">10.1016/j.jag.2016.05.010</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx42"><label>Kallenberg et al.(2025)</label><mixed-citation>Kallenberg, M., Paudel, D., Ofori-Ampofo, S., Baja, H., van Bree, R., Potze,  A., Poudel, P., Saleh, A., Anderson, W., von Bloh, M., Castellano, A.,  Ennaji, O., Hamed, R., Laudien, R., Lee, D., Luna, I., Masiliūnas, D.,  Meroni, M., Mutuku, J. M., Mkuhlani, S., Richetti, J., Ruane, A. C.,  Sahajpal, R., Shuai, G., Sitokonstantinou, V., de Souza Noia Junior, R.,  Srivastava, A. K., Strong, R., Sweet, L.-b., Vojnović, P., de Wit, A.,  Zachow, M., and Athanasiadis, I. N.: CY-Bench: A comprehensive benchmark  dataset for subnational crop yield forecasting, Zenodo [data set],  <ext-link xlink:href="https://doi.org/10.5281/zenodo.11502142" ext-link-type="DOI">10.5281/zenodo.11502142</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx43"><label>Kallenberg et al.(2026)</label><mixed-citation>Kallenberg, M., Paudel, D., Ofori-Ampofo, S., Baja, H., van Bree, R., Potze, A., Poudel, P., Saleh, A., Anderson, W., von Bloh, M., Castellano, A., Ennaji, O., Hamed, R., Laudien, R., Lee, D., Luna, I., Masiliunas, D., Meroni, M., Mutuku, J. M., Mkuhlani, S., Richetti, J., Ruane, A. C., Sahajpal, R., Shuai, G., Sitokonstantinou, V., de Souza Noia Junior, R., Srivastava, A. K., Strong, R., Sweet, L.-b., Vojnovic, P., de Wit, A., Zachow, M., and Athanasiadis, I. N.: WUR-AI/AgMLCY-Bench: CY-Bench v1.0.0: ESSD paper, Zenodo [code], <ext-link xlink:href="https://doi.org/10.5281/zenodo.20456375" ext-link-type="DOI">10.5281/zenodo.20456375</ext-link>, 2026.</mixed-citation></ref>
      <ref id="bib1.bibx44"><label>Kamilaris and Prenafeta-Boldú(2018)</label><mixed-citation>Kamilaris, A. and Prenafeta-Boldú, F. X.: Deep learning in agriculture: A survey, Comput. Electron. Agr., 147, 70–90, <ext-link xlink:href="https://doi.org/10.1016/j.compag.2018.02.016" ext-link-type="DOI">10.1016/j.compag.2018.02.016</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx45"><label>Kapoor and Narayanan(2023)</label><mixed-citation>Kapoor, S. and Narayanan, A.: Leakage and the reproducibility crisis in machine-learning-based science, Patterns, 4, 100804, <ext-link xlink:href="https://doi.org/10.1016/j.patter.2023.100804" ext-link-type="DOI">10.1016/j.patter.2023.100804</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx46"><label>Kebede et al.(2025)Kebede, Oluoch, Siebert, Mehta, Hartman, Jägermeyr, Ray, Ali, Brauman, Deng et al.</label><mixed-citation>Kebede, E. A., Oluoch, K. O., Siebert, S., Mehta, P., Hartman, S.,  Jägermeyr, J., Ray, D., Ali, T., Brauman, K. A., Deng, Q., Xie, W., and Davis, K. F.: A global open-source dataset of monthly irrigated and rainfed cropped areas (MIRCA-OS) for the 21st century, Sci. Data, 12, 208, <ext-link xlink:href="https://doi.org/10.1038/s41597-024-04313-w" ext-link-type="DOI">10.1038/s41597-024-04313-w</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx47"><label>Kerner et al.(2020)Kerner, Tseng, Becker-Reshef, Nakalembe, Barker, Munshell, Paliyam, and Hosseini</label><mixed-citation>Kerner, H., Tseng, G., Becker-Reshef, I., Nakalembe, C., Barker, B., Munshell, B., Paliyam, M., and Hosseini, M.: Rapid Response Crop Maps in Data Sparse Regions, in: ACM SIGKDD Conference on Data Mining and Knowledge Discovery Workshops, arXiv, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2006.16866" ext-link-type="DOI">10.48550/arXiv.2006.16866</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx48"><label>Khaki et al.(2020)Khaki, Wang, and Archontoulis</label><mixed-citation>Khaki, S., Wang, L., and Archontoulis, S. V.: A CNN-RNN framework for crop yield prediction, Front. Plant Sci., 10, 1750, <ext-link xlink:href="https://doi.org/10.3389/fpls.2019.01750" ext-link-type="DOI">10.3389/fpls.2019.01750</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx49"><label>Kondmann et al.(2021)Kondmann, Toker, Rußwurm, Camero, Peressuti, Milcinski, Mathieu, Longepe, Davis, Marchisio, Leal-Taixé, and Zhu</label><mixed-citation>Kondmann, L., Toker, A., Rußwurm, M., Camero, A., Peressuti, D., Milcinski, G., Mathieu, P.-P., Longepe, N., Davis, T., Marchisio, G., Leal-Taixé, L., and Zhu, X.: DENETHOR: The DynamicEarthNET dataset for Harmonized, inter-Operable, analysis-Ready, daily crop monitoring from space, in: Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks, edited by: Vanschoren, J. and Yeung, S., Vol. 1, Curran, <uri>https://openreview.net/pdf?id=uUa4jNMLjrL</uri> (last access: 30 May 2026), 2021.</mixed-citation></ref>
      <ref id="bib1.bibx50"><label>Koukos et al.(2024)</label><mixed-citation>Koukos, A., Jo, H.-W., Sitokonstantinou, V., Tsoumas, I., Kontoes, C., and Lee, W.-K.: Towards Global Crop Maps with Transfer Learning, in: IGARSS 2024 – 2024 IEEE International Geoscience and Remote Sensing Symposium, 1540–1545, IEEE, <ext-link xlink:href="https://doi.org/10.1109/IGARSS53475.2024.10641793" ext-link-type="DOI">10.1109/IGARSS53475.2024.10641793</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx51"><label>Lawes et al.(2022)Lawes, Mata, Richetti, Fletcher, and Herrmann</label><mixed-citation>Lawes, R., Mata, G., Richetti, J., Fletcher, A., and Herrmann, C.: Using remote sensing, process-based crop models, and machine learning to evaluate crop rotations across 20 million hectares in Western Australia, Agron. Sustain. Dev., 42, 120, <ext-link xlink:href="https://doi.org/10.1007/s13593-022-00851-y" ext-link-type="DOI">10.1007/s13593-022-00851-y</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx52"><label>Lecerf et al.(2019)Lecerf, Ceglar, López-Lozano, Van Der Velde, and Baruth</label><mixed-citation>Lecerf, R., Ceglar, A., López-Lozano, R., Van Der Velde, M., and Baruth, B.: Assessing the information in crop model and meteorological indicators to forecast crop yield over Europe, Agr. Syst., 168, 191–202, <ext-link xlink:href="https://doi.org/10.1016/j.agsy.2018.03.002" ext-link-type="DOI">10.1016/j.agsy.2018.03.002</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx53"><label>Lee et al.(2022)Lee, Davenport, Shukla, Husak, Funk, Harrison, McNally, Rowland, Budde, and Verdin</label><mixed-citation>Lee, D., Davenport, F., Shukla, S., Husak, G., Funk, C., Harrison, L., McNally, A., Rowland, J., Budde, M., and Verdin, J.: Maize yield forecasts for Sub-Saharan Africa using Earth Observation data and machine learning, Glob. Food Secur., 33, 100643, <ext-link xlink:href="https://doi.org/10.1016/j.gfs.2022.100643" ext-link-type="DOI">10.1016/j.gfs.2022.100643</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx54"><label>Lee et al.(2025)</label><mixed-citation>Lee, D., Anderson, W., Chen, X., Davenport, F., Shukla, S., Sahajpal, R.,  Budde, M., Rowland, J., Verdin, J., You, L., Ahouangbenon, M., Davis, K. F., Kebede, E., Ehrmann, S., Justice, C., and Meyer, C.: HarvestStat Africa – harmonized subnational crop statistics for sub-Saharan Africa, Sci. Data, 12, 690, <ext-link xlink:href="https://doi.org/10.1038/s41597-025-05001-z" ext-link-type="DOI">10.1038/s41597-025-05001-z</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx55"><label>Lesk et al.(2022)Lesk, Anderson, Rigden, Coast, Jägermeyr, McDermid, Davis, and Konar</label><mixed-citation>Lesk, C., Anderson, W., Rigden, A., Coast, O., Jägermeyr, J., McDermid, S., Davis, K. F., and Konar, M.: Compound heat and moisture extreme impacts on global crop yields under climate change, Nat. Rev. Earth  Environ., 3, 872–889, <ext-link xlink:href="https://doi.org/10.1038/s43017-022-00368-8" ext-link-type="DOI">10.1038/s43017-022-00368-8</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx56"><label>Liakos et al.(2018)Liakos, Busato, Moshou, Pearson, and Bochtis</label><mixed-citation>Liakos, K., Busato, P., Moshou, D., Pearson, S., and Bochtis, D.: Machine learning in agriculture: A review, Sensors, 18, 2674, <ext-link xlink:href="https://doi.org/10.3390/s18082674" ext-link-type="DOI">10.3390/s18082674</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx57"><label>Liliane and Charles(2020)</label><mixed-citation>Liliane, T. N. and Charles, M. S.: Factors Affecting Yield of Crops, in: Agronomy, edited by: Amanullah, Chap. 2, IntechOpen, Rijeka, <ext-link xlink:href="https://doi.org/10.5772/intechopen.90672" ext-link-type="DOI">10.5772/intechopen.90672</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx58"><label>Lin et al.(2024)Lin, Guillot, Crawford, Zhang, Yuan, and Tzeng</label><mixed-citation>Lin, F., Guillot, K., Crawford, S., Zhang, Y., Yuan, X., and Tzeng, N.-F.: An Open and Large-Scale Dataset for Multi-Modal Climate Change-aware Crop Yield Predictions, in: Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining,  5375–5386, ACM, <ext-link xlink:href="https://doi.org/10.1145/3637528.3671536" ext-link-type="DOI">10.1145/3637528.3671536</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx59"><label>Liu et al.(2022)Liu, Yang, Mohammadi, Song, Bi, and Wang</label><mixed-citation>Liu, Q., Yang, M., Mohammadi, K., Song, D., Bi, J., and Wang, G.: Machine Learning Crop Yield Models Based on Meteorological Features and Comparison with a Process-Based Model, Artificial Intelligence for the Earth Systems, 1, <ext-link xlink:href="https://doi.org/10.1175/AIES-D-22-0002.1" ext-link-type="DOI">10.1175/AIES-D-22-0002.1</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx60"><label>López et al.(2021)López, Way, and Sadok</label><mixed-citation> López, J., Way, D. A., and Sadok, W.: Systemic effects of rising atmospheric vapor pressure deficit on plant physiology and productivity, Glob. Change Biol., 27, 1704–1720, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx61"><label>Ma et al.(2023)Ma, Yang, Huang, and Zhang</label><mixed-citation>Ma, Y., Yang, Z., Huang, Q., and Zhang, Z.: Improving the Transferability of Deep Learning Models for Crop Yield Prediction: A Partial Domain Adaptation Approach, Remote Sens., 15, <ext-link xlink:href="https://doi.org/10.3390/rs15184562" ext-link-type="DOI">10.3390/rs15184562</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx62"><label>Mateo-Sanchis et al.(2021)Mateo-Sanchis, Piles, Amorós-López, Muñoz-Marí, Adsuara, Moreno-Martínez, and Camps-Valls</label><mixed-citation>Mateo-Sanchis, A., Piles, M., Amorós-López, J., Muñoz-Marí, J., Adsuara, J. E., Moreno-Martínez, Á., and Camps-Valls, G.: Learning main drivers of crop progress and failure in Europe with interpretable machine learning, Int. J. Appl. Earth Obs., 104, 102574, <ext-link xlink:href="https://doi.org/10.1016/j.jag.2021.102574" ext-link-type="DOI">10.1016/j.jag.2021.102574</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx63"><label>Mehrabi et al.(2022)Mehrabi, Delzeit, Ignaciuk, Levers, Braich, Bajaj, Amo-Aidoo, Anderson, Balgah, Benton, Chari, Ellis, Gahi, Gaupp, Garibaldi, Gerber, Godde, Grass, Heimann, Hirons, Hoogenboom, Jain, James, Makowski, Masamha, Meng, Monprapussorn, Müller, Nelson, Newlands, Noack, Oronje, Raymond, Reichstein, Rieseberg, Rodriguez-Llanes, Rosenstock, Rowhani, Sarhadi, Seppelt, Sidhu, Snapp, Soma, Sparks, Teh, Tigchelaar, Vogel, West, Wittman, and You</label><mixed-citation>Mehrabi, Z., Delzeit, R., Ignaciuk, A., Levers, C., Braich, G., Bajaj, K., Amo-Aidoo, A., Anderson, W., Balgah, R. A., Benton, T. G., Chari, M. M., Ellis, E. C., Gahi, N. Z., Gaupp, F., Garibaldi, L. A., Gerber, J. S., Godde, C. M., Grass, I., Heimann, T., Hirons, M., Hoogenboom, G., Jain, M., James, D., Makowski, D., Masamha, B., Meng, S., Monprapussorn, S., Müller, D., Nelson, A., Newlands, N. K., Noack, F., Oronje, M., Raymond, C., Reichstein, M., Rieseberg, L. H., Rodriguez-Llanes, J. M., Rosenstock, T., Rowhani, P., Sarhadi, A., Seppelt, R., Sidhu, B. S., Snapp, S., Soma, T., Sparks, A. H., Teh, L., Tigchelaar, M., Vogel, M. M., West, P. C., Wittman, H., and You, L.: Research priorities for global food security under extreme events, One Earth, 5, 756–766, <ext-link xlink:href="https://doi.org/10.1016/j.oneear.2022.06.008" ext-link-type="DOI">10.1016/j.oneear.2022.06.008</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx64"><label>Meroni et al.(2019)Meroni, Fasbender, Rembold, Atzberger, and Klisch</label><mixed-citation>Meroni, M., Fasbender, D., Rembold, F., Atzberger, C., and Klisch, A.: Near real-time vegetation anomaly detection with MODIS NDVI: Timeliness vs. accuracy and effect of anomaly computation options, Remote Sens. Environ., 221, 508–521, <ext-link xlink:href="https://doi.org/10.1016/j.rse.2018.11.041" ext-link-type="DOI">10.1016/j.rse.2018.11.041</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx65"><label>Meroni et al.(2021)Meroni, Waldner, Seguini, Kerdiles, and Rembold</label><mixed-citation>Meroni, M., Waldner, F., Seguini, L., Kerdiles, H., and Rembold, F.: Yield forecasting with machine learning and small data: What gains for grains?, Agr. Forest Meteorol., 308, 108555, <ext-link xlink:href="https://doi.org/10.1016/j.agrformet.2021.108555" ext-link-type="DOI">10.1016/j.agrformet.2021.108555</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx66"><label>Mexico(2019)</label><mixed-citation>Mexico: INEGI. Agricultural Census and Survey Data, <uri>https://www.inegi.org.mx</uri> (last access: 10 April 2024), 2019.</mixed-citation></ref>
      <ref id="bib1.bibx67"><label>Meyer and Pebesma(2022)</label><mixed-citation>Meyer, H. and Pebesma, E.: Machine learning-based global maps of ecological variables and the challenge of assessing them, Nat. Commun., 13, 2208, <ext-link xlink:href="https://doi.org/10.1038/s41467-022-29838-9" ext-link-type="DOI">10.1038/s41467-022-29838-9</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx68"><label>Minoli et al.(2019)Minoli, Egli, Rolinski, and Müller</label><mixed-citation>Minoli, S., Egli, D. B., Rolinski, S., and Müller, C.: Modelling cropping periods of grain crops at the global scale, Global Planet. Change, 174, 35–46, <ext-link xlink:href="https://doi.org/10.1016/j.gloplacha.2018.12.013" ext-link-type="DOI">10.1016/j.gloplacha.2018.12.013</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx69"><label>Miralles et al.(2025)</label><mixed-citation>Miralles, D. G., Bonte, O., Koppa, A., Baez-Villanueva, O. M., Tronquo, E.,  Zhong, F., Beck, H. E., Hulsman, P., Dorigo, W., Verhoest, N. E., and Haghdoost, S.: GLEAM4: global land evaporation and soil moisture dataset at 0.1° resolution from 1980 to near present, Sci. Data, 12, 416, <ext-link xlink:href="https://doi.org/10.1038/s41597-025-04610-y" ext-link-type="DOI">10.1038/s41597-025-04610-y</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx70"><label>Mitrovic et al.(2020)Mitrovic, McWilliams, Walker, Buesing, and Blundell</label><mixed-citation>Mitrovic, J., McWilliams, B., Walker, J., Buesing, L., and Blundell, C.: Representation learning via invariant causal mechanisms, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2010.07922" ext-link-type="DOI">10.48550/arXiv.2010.07922</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx71"><label>Nakalembe and Kerner(2023)</label><mixed-citation>Nakalembe, C. and Kerner, H.: Considerations for AI-EO for agriculture in Sub-Saharan Africa, Environ. Res. Lett., 18, 041002, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/acc476" ext-link-type="DOI">10.1088/1748-9326/acc476</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx72"><label>Neophytides et al.(2024)</label><mixed-citation>Neophytides, S. P., Tsoumas, I., Tsalakou, A., Christoforou, M.,  Mavrovouniotis, M., Eliades, M., Papoutsa, C., Kontoes, C., and Hadjimitsis,  D. G.: Invariant learning as a pathway to robust potato yield prediction, in:  Remote Sensing for Agriculture, Ecosystems, and Hydrology XXVI, SPIE, 13191, 33–42, <ext-link xlink:href="https://doi.org/10.1117/12.3031554" ext-link-type="DOI">10.1117/12.3031554</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx73"><label>Nowakowski et al.(2021)Nowakowski, Mrziglod, Spiller, Bonifacio, Ferrari, Mathieu, Garcia-Herranz, and Kim</label><mixed-citation>Nowakowski, A., Mrziglod, J., Spiller, D., Bonifacio, R., Ferrari, I., Mathieu, P. P., Garcia-Herranz, M., and Kim, D.-H.: Crop type mapping by using transfer learning, Int. J. Appl. Earth Obs., 98, 102313, <ext-link xlink:href="https://doi.org/10.1016/j.jag.2021.102313" ext-link-type="DOI">10.1016/j.jag.2021.102313</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx74"><label>Oikonomidis et al.(2022)Oikonomidis, Catal, and Kassahun</label><mixed-citation>Oikonomidis, A., Catal, C., and Kassahun, A.: Deep learning for crop yield prediction: a systematic literature review, New Zeal. J. Crop Hort.,  1–26, <ext-link xlink:href="https://doi.org/10.1080/01140671.2022.2032213" ext-link-type="DOI">10.1080/01140671.2022.2032213</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx75"><label>Paudel et al.(2021)Paudel, Boogaard, de Wit, Janssen, Osinga, Pylianidis, and Athanasiadis</label><mixed-citation>Paudel, D., Boogaard, H., de Wit, A., Janssen, S., Osinga, S., Pylianidis, C., and Athanasiadis, I. N.: Machine learning for large-scale crop yield forecasting, Agr. Syst., 187, 103016, <ext-link xlink:href="https://doi.org/10.1016/j.agsy.2020.103016" ext-link-type="DOI">10.1016/j.agsy.2020.103016</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx76"><label>Paudel et al.(2022)Paudel, Boogaard, de Wit, van der Velde, Claverie, Nisini, Janssen, Osinga, and Athanasiadis</label><mixed-citation>Paudel, D., Boogaard, H., de Wit, A., van der Velde, M., Claverie, M., Nisini, L., Janssen, S., Osinga, S., and Athanasiadis, I. N.: Machine learning for regional crop yield forecasting in Europe, Field Crop. Res., 276, 108377, <ext-link xlink:href="https://doi.org/10.1016/j.fcr.2021.108377" ext-link-type="DOI">10.1016/j.fcr.2021.108377</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx77"><label>Paudel et al.(2023)Paudel, Marcos, de Wit, Boogaard, and Athanasiadis</label><mixed-citation>Paudel, D., Marcos, D., de Wit, A., Boogaard, H., and Athanasiadis, I. N.: A weakly supervised framework for high-resolution crop yield forecasts, Environ. Res. Lett., 18, 094062, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/acf50e" ext-link-type="DOI">10.1088/1748-9326/acf50e</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx78"><label>Paudel et al.(2023b)Paudel, Marcos, de Wit, Boogaard, and Athanasiadis</label><mixed-citation>Paudel, D. R., Marcos, D., de Wit, A., Boogaard, H., and Athanasiadis, I. N.: A weakly supervised framework for high resolution crop yield forecasts, Environ. Res. Lett., 18, 094062, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/acf50e" ext-link-type="DOI">10.1088/1748-9326/acf50e</ext-link>, 2023b.</mixed-citation></ref>
      <ref id="bib1.bibx79"><label>Pelletier et al.(2019)Pelletier, Webb, and Petitjean</label><mixed-citation>Pelletier, C., Webb, G. I., and Petitjean, F.: Temporal Convolutional Neural Network for the Classification of Satellite Image Time Series, Remote Sens., 11, <ext-link xlink:href="https://doi.org/10.3390/rs11050523" ext-link-type="DOI">10.3390/rs11050523</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx80"><label>Poggio et al.(2021)Poggio, De Sousa, Batjes, Heuvelink, Kempen, Ribeiro, and Rossiter</label><mixed-citation>Poggio, L., de Sousa, L. M., Batjes, N. H., Heuvelink, G. B. M., Kempen, B., Ribeiro, E., and Rossiter, D.: SoilGrids 2.0: producing soil information for the globe with quantified spatial uncertainty, SOIL, 7, 217–240, <ext-link xlink:href="https://doi.org/10.5194/soil-7-217-2021" ext-link-type="DOI">10.5194/soil-7-217-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx81"><label>Portmann et al.(2010)Portmann, Siebert, and Döll</label><mixed-citation>Portmann, F. T., Siebert, S., and Döll, P.: MIRCA2000 – Global monthly irrigated and rainfed crop areas around the year 2000: A new high-resolution data set for agricultural and hydrological modeling, Global Biogeochem. Cy., 24, <ext-link xlink:href="https://doi.org/10.1029/2008GB003435" ext-link-type="DOI">10.1029/2008GB003435</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx82"><label>Potter(2019)</label><mixed-citation>Potter, N. A.: rnassqs: An “R” package to access agricultural data via the USDA National Agricultural Statistics Service (USDA-NASS) “Quick Stats” API, Journal of Open Source Software, 4, 1880, <ext-link xlink:href="https://doi.org/10.21105/joss.01880" ext-link-type="DOI">10.21105/joss.01880</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx83"><label>Priyatikanto et al.(2023)Priyatikanto, Lu, Dash, and Sheffield</label><mixed-citation>Priyatikanto, R., Lu, Y., Dash, J., and Sheffield, J.: Improving generalisability and transferability of machine-learning-based maize yield prediction model through domain adaptation, Agr. Forest Meteorol., 341, 109652, <ext-link xlink:href="https://doi.org/10.1016/j.agrformet.2023.109652" ext-link-type="DOI">10.1016/j.agrformet.2023.109652</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx84"><label>Pushkarna et al.(2022)Pushkarna, Zaldivar, and Kjartansson</label><mixed-citation>Pushkarna, M., Zaldivar, A., and Kjartansson, O.: Data Cards: Purposeful and transparent dataset documentation for responsible AI, in: Proceedings of the 2022 ACM Conference on Fairness, Accountability, and Transparency, 1776–1826, <ext-link xlink:href="https://doi.org/10.1145/3531146.3533231" ext-link-type="DOI">10.1145/3531146.3533231</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx85"><label>Richards et al.(2023)Richards, Kirichenko, Bouchacourt, and Ibrahim</label><mixed-citation>Richards, M., Kirichenko, P., Bouchacourt, D., and Ibrahim, M.: Does Progress On Object Recognition Benchmarks Improve Real-World Generalization?, arXiv, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2307.13136" ext-link-type="DOI">10.48550/arXiv.2307.13136</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx86"><label>Richetti et al.(2023)Richetti, Diakogianis, Bender, Colaço, and Lawes</label><mixed-citation>Richetti, J., Diakogianis, F. I., Bender, A., Colaço, A. F., and Lawes, R. A.: A methods guideline for deep learning for tabular data in agriculture with a case study to forecast cereal yield, Comput. Electron. Agr., 205, 107642, <ext-link xlink:href="https://doi.org/10.1016/j.compag.2023.107642" ext-link-type="DOI">10.1016/j.compag.2023.107642</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx87"><label>Rodell et al.(2004)Rodell, Houser, Jambor, Gottschalck, Mitchell, Meng, Arsenault, Cosgrove, Radakovich, Bosilovich et al.</label><mixed-citation>Rodell, M., Houser, P., Jambor, U., Gottschalck, J., Mitchell, K., Meng, C.-J., Arsenault, K., Cosgrove, B., Radakovich, J., Bosilovich, M., Entin, J. K., Walker, J. P., Lohmann, D., and Toll, D.: The global land data assimilation system, B. Am. Meteorol. Soc., 85, 381–394, <ext-link xlink:href="https://doi.org/10.1175/BAMS-85-3-381" ext-link-type="DOI">10.1175/BAMS-85-3-381</ext-link>, 2004.</mixed-citation></ref>
      <ref id="bib1.bibx88"><label>Rolnick et al.(2024)Rolnick, Aspuru-Guzik, Beery, Dilkina, Donti, Ghassemi, Kerner, Monteleoni, Rolf, Tambe, and White</label><mixed-citation>Rolnick, D., Aspuru-Guzik, A., Beery, S., Dilkina, B., Donti, P. L., Ghassemi, M., Kerner, H., Monteleoni, C., Rolf, E., Tambe, M., and White, A.: Application-Driven Innovation in Machine Learning, arXiv, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2403.17381" ext-link-type="DOI">10.48550/arXiv.2403.17381</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx89"><label>Ronchetti et al.(2024)Ronchetti, Nisini Scacchiafichi, Seguini, Cerrani, and van der Velde</label><mixed-citation>Ronchetti, G., Nisini Scacchiafichi, L., Seguini, L., Cerrani, I., and van der Velde, M.: Harmonized European Union subnational crop statistics can reveal climate impacts and crop cultivation shifts, Earth Syst. Sci. Data, 16, 1623–1649, <ext-link xlink:href="https://doi.org/10.5194/essd-16-1623-2024" ext-link-type="DOI">10.5194/essd-16-1623-2024</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx90"><label>Rußwurm et al.(2019)Rußwurm, Lefèvre, and Körner</label><mixed-citation>Rußwurm, M., Lefèvre, S., and Körner, M.: BreizhCrops: A Satellite Time Series Dataset for Crop Type Identification, arXiv, <ext-link xlink:href="https://doi.org/10.48550/arXiv.1905.11893" ext-link-type="DOI">10.48550/arXiv.1905.11893</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx91"><label>Rußwurm and Körner(2018)</label><mixed-citation>Rußwurm, M. and Körner, M.: Multi-Temporal Land Cover Classification with Sequential Recurrent Encoders, ISPRS Int. J. Geo-Inf., 7, <ext-link xlink:href="https://doi.org/10.3390/ijgi7040129" ext-link-type="DOI">10.3390/ijgi7040129</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx92"><label>Sacks et al.(2010)Sacks, Deryng, Foley, and Ramankutty</label><mixed-citation> Sacks, W. J., Deryng, D., Foley, J. A., and Ramankutty, N.: Crop planting dates: an analysis of global patterns, Global Ecol. Biogeogr., 19, 607–620, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx93"><label>Sainte Fare Garnot et al.(2020)Sainte Fare Garnot, Landrieu, Giordano, and Chehata</label><mixed-citation>Sainte Fare Garnot, V., Landrieu, L., Giordano, S., and Chehata, N.: Satellite Image Time Series Classification with Pixel-Set Encoders and Temporal Self-Attention, CVPR, <ext-link xlink:href="https://doi.org/10.1109/CVPR42600.2020.01234" ext-link-type="DOI">10.1109/CVPR42600.2020.01234</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx94"><label>Schauberger et al.(2020)Schauberger, Jägermeyr, and Gornott</label><mixed-citation>Schauberger, B., Jägermeyr, J., and Gornott, C.: A systematic review of local to regional yield forecasting approaches and frequently used data resources, Eur. J. Agron., 120, 126153, <ext-link xlink:href="https://doi.org/10.1016/j.eja.2020.126153" ext-link-type="DOI">10.1016/j.eja.2020.126153</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx95"><label>Schlenker and Roberts(2009)</label><mixed-citation>Schlenker, W. and Roberts, M. J.: Nonlinear temperature effects indicate severe damages to U.S. crop yields under climate change, P. Natl. Acad. Sci., 106, 15594–15598, <ext-link xlink:href="https://doi.org/10.1073/pnas.0906865106" ext-link-type="DOI">10.1073/pnas.0906865106</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bibx96"><label>Schneider et al.(2023a)</label><mixed-citation>Schneider, K. R., Fanzo, J., Haddad, L., Herrero, M., Moncayo, J. R., Herforth, A., Remans, R., Guarin, A., Resnick, D., Covic, N., Béné, C., Cattaneo, A., Aburto, N., Ambikapathi, R., Aytekin, D., Barquera, S., Battersby, J., Beal, T., Molina, P. B., Cafiero, C., Campeau, C., Caron, P., Conforti, P., Damerau, K., Di Girolamo, M., DeClerck, F., Dewi, D., Elouafi, I., Fabi, C., Foley, P., Frazier, T. J., Gephart, J., Golden, C., Fischer, C. G., Hendriks, S., Honorati, M., Huang, J., Kennedy, G., Laar, A., Lal, R., Lidder, P., Loken, B., Marshall, Q., Masuda, Y. J., McLaren, R., Miachon, L., Muñoz, H., Nordhagen, S., Qayyum, N., Saisana, M., Suhardiman, D., Sumaila, U. R., Cullen, M. T., Tubiello, F. N., Vivero-Pol, J.-L., Webb, P., and Wiebe, K.: The state of food systems worldwide in the countdown to 2030, Nature Food, 4, 1090–1110, <ext-link xlink:href="https://doi.org/10.1038/s43016-023-00885-9" ext-link-type="DOI">10.1038/s43016-023-00885-9</ext-link>, 2023a.</mixed-citation></ref>
      <ref id="bib1.bibx97"><label>Schneider et al.(2023b)Schneider, Schelte, Schmitz et al.</label><mixed-citation>Schneider, M., Schelte, T., Schmitz, F., and Körner, M.: EuroCrops: The Largest Harmonized Open Crop Dataset Across the European Union, Sci. Data, 10, 612, <ext-link xlink:href="https://doi.org/10.1038/s41597-023-02517-0" ext-link-type="DOI">10.1038/s41597-023-02517-0</ext-link>, 2023b.</mixed-citation></ref>
      <ref id="bib1.bibx98"><label>Seguini et al.(2026)Seguini, Klisch, Meroni, Vrieling, Manfron, Atzberger, and Rembold</label><mixed-citation>Seguini, L., Klisch, A., Meroni, M., Vrieling, A., Manfron, G., Atzberger, C., and Rembold, F.: Global near real-time 500 m 10 d FPAR dataset from MODIS and VIIRS for operational agricultural monitoring and crop yield forecasting, Earth Syst. Sci. Data, 18, 309–331, <ext-link xlink:href="https://doi.org/10.5194/essd-18-309-2026" ext-link-type="DOI">10.5194/essd-18-309-2026</ext-link>, 2026.</mixed-citation></ref>
      <ref id="bib1.bibx99"><label>Seidel et al.(2018)Seidel, Palosuo, Thorburn, and Wallach</label><mixed-citation>Seidel, S., Palosuo, T., Thorburn, P., and Wallach, D.: Towards improved calibration of crop models – Where are we now and where should we go?, Eur. J. Agron., 94, 25–35, <ext-link xlink:href="https://doi.org/10.1016/j.eja.2018.01.006" ext-link-type="DOI">10.1016/j.eja.2018.01.006</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx100"><label>Singh et al.(2022)</label><mixed-citation>Singh, K., Singh, D., Goroshi, S., Yashu, S., Kumar, Y., Solanki, S., and  Sagar, S.: Crop Yield forecasting under FASAL (Forecasting Agricultural  output using Space Agrometeorology and Land based observations), Tech. rep., India Meteorological Department (IMD), Ministry of Earth Sciences (MoES), Government of India, <ext-link xlink:href="https://doi.org/10.13140/RG.2.2.11593.42083" ext-link-type="DOI">10.13140/RG.2.2.11593.42083</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx101"><label>Stuart et al.(2024)Stuart, Hobbins, Niebuhr, Ruane, Pulwarty, Hoell, Thiaw, Rosenzweig, Muñoz-Arriola, Jahn et al.</label><mixed-citation>Stuart, L., Hobbins, M., Niebuhr, E., Ruane, A. C., Pulwarty, R., Hoell, A.,  Thiaw, W., Rosenzweig, C., Muñoz-Arriola, F., Jahn, M., and Farrar, M.: Enhancing Global Food Security: Opportunities for the American  Meteorological Society, B. Am. Meteorol. Soc., 104, E760–E777, <ext-link xlink:href="https://doi.org/10.1175/BAMS-D-22-0106.1" ext-link-type="DOI">10.1175/BAMS-D-22-0106.1</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx102"><label>Sweet et al.(2023)Sweet, Müller, Anand, and Zscheischler</label><mixed-citation>Sweet, L.-B., Müller, C., Anand, M., and Zscheischler, J.: Cross-Validation Strategy Impacts the Performance and Interpretation of Machine Learning Models, Artificial Intelligence for the Earth Systems, 2, <ext-link xlink:href="https://doi.org/10.1175/AIES-D-23-0026.1" ext-link-type="DOI">10.1175/AIES-D-23-0026.1</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx103"><label>Sweet et al.(2025)Sweet, Athanasiadis, van Bree, Castellano, Martre, Paudel, Ruane, and Zscheischler</label><mixed-citation>Sweet, L. B., Athanasiadis, I. N., van Bree, R., Castellano, A., Martre, P., Paudel, D., Ruane, A. C., and Zscheischler, J.: Transdisciplinary coordination is essential for advancing agricultural modeling with machine learning, One Earth, <ext-link xlink:href="https://doi.org/10.1016/j.oneear.2025.101233" ext-link-type="DOI">10.1016/j.oneear.2025.101233</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx104"><label>Tadesse et al.(2015)Tadesse, Senay, Berhan, Regassa, and Beyene</label><mixed-citation> Tadesse, T., Senay, G. B., Berhan, G., Regassa, T., and Beyene, S.: Evaluating a satellite-based seasonal evapotranspiration product and identifying its relationship with other satellite-derived products and crop yield: A case study for Ethiopia, Int. J. Appl. Earth Obs., 40, 39–54, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx105"><label>Tanaka et al.(2023)Tanaka, Sun, Becker-Reshef, Song, and Puricelli</label><mixed-citation>Tanaka, T., Sun, L., Becker-Reshef, I., Song, X.-P., and Puricelli, E.: Satellite forecasting of crop harvest can trigger a cross-hemispheric production response and improve global food security, Commun. Earth Environ., 4, 1–9, <ext-link xlink:href="https://doi.org/10.1038/s43247-023-00992-2" ext-link-type="DOI">10.1038/s43247-023-00992-2</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx106"><label>Thomas and Uminsky(2022)</label><mixed-citation>Thomas, R. L. and Uminsky, D.: Reliance on metrics is a fundamental challenge for AI, Patterns, 3, 100476, <ext-link xlink:href="https://doi.org/10.1016/j.patter.2022.100476" ext-link-type="DOI">10.1016/j.patter.2022.100476</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx107"><label>Tsaftaris and Scharr(2019)</label><mixed-citation>Tsaftaris, S. A. and Scharr, H.: Sharing the Right Data Right: A Symbiosis with Machine Learning, Trends  Plant Sci., 24, 99–102, <ext-link xlink:href="https://doi.org/10.1016/j.tplants.2018.10.016" ext-link-type="DOI">10.1016/j.tplants.2018.10.016</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx108"><label>Tseng et al.(2021a)Tseng, Kerner, Nakalembe, and Becker-Reshef</label><mixed-citation>Tseng, G., Kerner, H., Nakalembe, C., and Becker-Reshef, I.: Learning to predict crop type from heterogeneous sparse labels using meta-learning, in: 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), 1111–1120, <ext-link xlink:href="https://doi.org/10.1109/CVPRW53098.2021.00122" ext-link-type="DOI">10.1109/CVPRW53098.2021.00122</ext-link>, 2021a.</mixed-citation></ref>
      <ref id="bib1.bibx109"><label>Tseng et al.(2021b)Tseng, Zvonkov, Nakalembe, and Kerner</label><mixed-citation>Tseng, G., Zvonkov, I., Nakalembe, C., and Kerner, H.: CropHarvest: A global  dataset for crop-type classification, in: Proceedings of the Neural  Information Processing Systems Track on Datasets and Benchmarks, edited by:  Vanschoren, J. and Yeung, S., Vol. 1, Curran, <uri>https://openreview.net/pdf?id=JtjzUXPEaCu</uri> (last access: 30 May 2026),  2021b.</mixed-citation></ref>
      <ref id="bib1.bibx110"><label>Tseng et al.(2022)Tseng, Kerner, and Rolnick</label><mixed-citation>Tseng, G., Kerner, H., and Rolnick, D.: TIML: Task-Informed Meta-Learning for Agriculture, arXiv, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2202.02124" ext-link-type="DOI">10.48550/arXiv.2202.02124</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx111"><label>Tzachor et al.(2022)Tzachor, Devare, King, Avin, and Ó hÉigeartaigh</label><mixed-citation>Tzachor, A., Devare, M., King, B., Avin, S., and Ó hÉigeartaigh, S.: Responsible artificial intelligence in agriculture requires systemic understanding of risks and externalities, Nature Machine Intelligence, 4, 104–109, <ext-link xlink:href="https://doi.org/10.1038/s42256-022-00440-4" ext-link-type="DOI">10.1038/s42256-022-00440-4</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx112"><label>van der Velde and Nisini(2019)</label><mixed-citation>van der Velde, M. and Nisini, L.: Performance of the MARS-crop yield forecasting system for the European Union: Assessing accuracy, in-season, and year-to-year improvements from 1993 to 2015, Agr. Syst., 168, 203–212, <ext-link xlink:href="https://doi.org/10.1016/j.agsy.2018.06.009" ext-link-type="DOI">10.1016/j.agsy.2018.06.009</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx113"><label>Van Klompenburg et al.(2020)Van Klompenburg, Kassahun, and Catal</label><mixed-citation>Van Klompenburg, T., Kassahun, A., and Catal, C.: Crop yield prediction using machine learning: A systematic literature review, Comput. Electron. Agr., 177, 105709, <ext-link xlink:href="https://doi.org/10.1016/j.compag.2020.105709" ext-link-type="DOI">10.1016/j.compag.2020.105709</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx114"><label>Van Tricht et al.(2023)Van Tricht, Degerickx, Gilliams, Zanaga, Battude, Grosu, Brombacher, Lesiv, Bayas, Karanam et al.</label><mixed-citation>Van Tricht, K., Degerickx, J., Gilliams, S., Zanaga, D., Battude, M., Grosu, A., Brombacher, J., Lesiv, M., Bayas, J. C. L., Karanam, S., Fritz, S., Becker-Reshef, I., Franch, B., Mollà-Bononad, B., Boogaard, H., Pratihast, A. K., Koetz, B., and Szantoi, Z.: WorldCereal: a dynamic open-source system for global-scale, seasonal, and reproducible crop and irrigation mapping, Earth Syst. Sci. Data, 15, 5491–5515, <ext-link xlink:href="https://doi.org/10.5194/essd-15-5491-2023" ext-link-type="DOI">10.5194/essd-15-5491-2023</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx115"><label>Vermote(2015)</label><mixed-citation>Vermote, E.: MOD09CMG MODIS/Terra Surface Reflectance Daily L3 Global 0.05Deg  CMG V006, NASA Land Processes Distributed Active Archive Center [data set], <ext-link xlink:href="https://doi.org/10.5067/MODIS/MOD09CMG.006" ext-link-type="DOI">10.5067/MODIS/MOD09CMG.006</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx116"><label>Vijverberg et al.(2023)Vijverberg, Hamed, and Coumou</label><mixed-citation>Vijverberg, S., Hamed, R., and Coumou, D.: Skillful U.S. Soy Yield Forecasts at Presowing Lead Times, Artificial Intelligence for the Earth Systems, 2, <ext-link xlink:href="https://doi.org/10.1175/AIES-D-21-0009.1" ext-link-type="DOI">10.1175/AIES-D-21-0009.1</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx117"><label>Waha et al.(2012)Waha, Van Bussel, Müller, and Bondeau</label><mixed-citation>Waha, K., Van Bussel, L., Müller, C., and Bondeau, A.: Climate-driven simulation of global crop sowing dates, Global Ecol. Biogeogr., 21, 247–259, <ext-link xlink:href="https://doi.org/10.1111/j.1466-8238.2011.00678.x" ext-link-type="DOI">10.1111/j.1466-8238.2011.00678.x</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bibx118"><label>Wallach et al.(2021)Wallach, Palosuo, Thorburn, Hochman, Gourdain, Andrianasolo, Asseng, Basso, Buis, Crout, Dibari, Dumont, Ferrise, Gaiser, Garcia, Gayler, Ghahramani, Hiremath, Hoek, Horan, Hoogenboom, Huang, Jabloun, Jansson, Jing, Justes, Kersebaum, Klosterhalfen, Launay, Lewan, Luo, Maestrini, Mielenz, Moriondo, Nariman Zadeh, Padovan, Olesen, Poyda, Priesack, Pullens, Qian, Schütze, Shelia, Souissi, Specka, Srivastava, Stella, Streck, Trombi, Wallor, Wang, Weber, Weihermüller, de Wit, Wöhling, Xiao, Zhao, Zhu, and Seidel</label><mixed-citation>Wallach, D., Palosuo, T., Thorburn, P., Hochman, Z., Gourdain, E., Andrianasolo, F., Asseng, S., Basso, B., Buis, S., Crout, N., Dibari, C., Dumont, B., Ferrise, R., Gaiser, T., Garcia, C., Gayler, S., Ghahramani, A., Hiremath, S., Hoek, S., Horan, H., Hoogenboom, G., Huang, M., Jabloun, M., Jansson, P.-E., Jing, Q., Justes, E., Kersebaum, K. C., Klosterhalfen, A., Launay, M., Lewan, E., Luo, Q., Maestrini, B., Mielenz, H., Moriondo, M., Nariman Zadeh, H., Padovan, G., Olesen, J. E., Poyda, A., Priesack, E., Pullens, J. W. M., Qian, B., Schütze, N., Shelia, V., Souissi, A., Specka, X., Srivastava, A. K., Stella, T., Streck, T., Trombi, G., Wallor, E., Wang, J., Weber, T. K., Weihermüller, L., de Wit, A., Wöhling, T., Xiao, L., Zhao, C., Zhu, Y., and Seidel, S. J.: The chaos in calibrating crop models: Lessons learned from a multi-model calibration exercise, Environ. Model. Softw., 145, 105206, <ext-link xlink:href="https://doi.org/10.1016/j.envsoft.2021.105206" ext-link-type="DOI">10.1016/j.envsoft.2021.105206</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx119"><label>Wang et al.(2022)Wang, Albrecht, Braham, Mou, and Zhu</label><mixed-citation>Wang, Y., Albrecht, C. M., Braham, N. A. A., Mou, L., and Zhu, X. X.: Self-supervised learning in remote sensing: A review, IEEE Geosci. Remote S., 10, 213–247, 2022.  </mixed-citation></ref>
      <ref id="bib1.bibx120"><label>Watson(2022)</label><mixed-citation>Watson, P. A. G.: Machine learning applications for weather and climate need greater focus on extremes, Environ. Res. Lett., 17, 111004, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/ac9d4e" ext-link-type="DOI">10.1088/1748-9326/ac9d4e</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx121"><label>Xu et al.(2024)Xu, Ma, and Zhang</label><mixed-citation> Xu, Y., Ma, Y., and Zhang, Z.: Self-supervised pre-training for large-scale crop mapping using Sentinel-2 time series, ISPRS J. Photogramm., 207, 312–325, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx122"><label>Yeh et al.(2021)</label><mixed-citation>Yeh, C., Meng, C., Wang, S., Driscoll, A., Rozi, E., Liu, P., Lee, J., Burke,  M., Lobell, D., and Ermon, S.: SustainBench: Benchmarks for Monitoring the  Sustainable Development Goals with Machine Learning, in: Thirty-fifth  Conference on Neural Information Processing Systems, Datasets and Benchmarks  Track (Round 2), Curran Associates, Inc., <uri>https://openreview.net/forum?id=5HR3vCylqD</uri> (last access: 30 May 2026),  2021.</mixed-citation></ref>
      <ref id="bib1.bibx123"><label>You et al.(2017)You, Li, Low, Lobell, and Ermon</label><mixed-citation>You, J., Li, X., Low, M., Lobell, D., and Ermon, S.: Deep Gaussian Process for Crop Yield Prediction Based on Remote Sensing Data, in: Proceedings of the AAAI Conference on Artificial Intelligence, Association for the Advancement of Artificial Intelligence (AAAI), Vol. 31,  <ext-link xlink:href="https://doi.org/10.1609/aaai.v31i1.11172" ext-link-type="DOI">10.1609/aaai.v31i1.11172</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx124"><label>Zelingher and Makowski(2023)</label><mixed-citation>Zelingher, R. and Makowski, D.: Investigating and forecasting the impact of crop production shocks on global commodity prices, Environ. Res. Lett., 19, 014026, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/ad0dda" ext-link-type="DOI">10.1088/1748-9326/ad0dda</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx125"><label>Zhang et al.(2022)Zhang, van der Wiel, Wei, Screen, Yue, Zheng, Selten, Bintanja, Anderson, Blackport, Glomsrød, Liu, Cui, and Yang</label><mixed-citation>Zhang, T., van der Wiel, K., Wei, T., Screen, J., Yue, X., Zheng, B., Selten, F., Bintanja, R., Anderson, W., Blackport, R., Glomsrød, S., Liu, Y., Cui, X., and Yang, X.: Increased wheat price spikes and larger economic inequality with 2 °C global warming, One Earth, 5, 907–916, <ext-link xlink:href="https://doi.org/10.1016/j.oneear.2022.07.004" ext-link-type="DOI">10.1016/j.oneear.2022.07.004</ext-link>, 2022.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>CY-Bench: a comprehensive benchmark dataset for sub-national crop yield forecasting</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>Ambikapathi et al.(2022)Ambikapathi, Schneider, Davis, Herrero,
Winters, and Fanzo</label><mixed-citation>
      
Ambikapathi, R., Schneider, K. R., Davis, B., Herrero, M., Winters, P., and
Fanzo, J. C.: Global food systems transitions have enabled affordable diets
but had less favourable outcomes for nutrition, environmental health,
inclusion and equity, Nature Food, 3, 764–779,
<a href="https://doi.org/10.1038/s43016-022-00588-7" target="_blank">https://doi.org/10.1038/s43016-022-00588-7</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>Argentina(2016)</label><mixed-citation>
      
Argentina: Ministerio de Agricultura, Ganadería y Pesca. “Estimaciones
Agrícolas”,
<a href="https://datosestimaciones.magyp.gob.ar/reportes.php?reporte=Estimaciones" target="_blank"/>
(last access: 29 April 2016), 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>Australia(2024)</label><mixed-citation>
      
Australia: ABARES. Australian Bureau of Agricultural and Resource Economics and
Sciences Farm Data Portal,
<a href="https://www.agriculture.gov.au/abares/data/farm-data-portal#data-download" target="_blank"/>
(last access: 5 March 2024), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>Basso and Liu(2019)</label><mixed-citation>
      
Basso, B. and Liu, L.: Seasonal crop yield forecast: Methods, applications, and
accuracies, Adv. Agron.,  154, 201–255,
<a href="https://doi.org/10.1016/bs.agron.2018.11.002" target="_blank">https://doi.org/10.1016/bs.agron.2018.11.002</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>Batjes(2016)</label><mixed-citation>
      
Batjes, N. H.: Harmonized soil property values for broad-scale modelling
(WISE30sec) with estimates of global soil carbon stocks, Geoderma, 269,
61–68, <a href="https://doi.org/10.1016/j.geoderma.2016.01.034" target="_blank">https://doi.org/10.1016/j.geoderma.2016.01.034</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>Becker-Reshef et al.(2020)Becker-Reshef, Justice, Barker, Humber,
Rembold, Bonifacio, Zappacosta, Budde, Magadzire, Shitote, Pound,
Constantino, Nakalembe, Mwangi, Sobue, Newby, Whitcraft, Jarvis, and
Verdin</label><mixed-citation>
      
Becker-Reshef, I., Justice, C., Barker, B., Humber, M., Rembold, F., Bonifacio,
R., Zappacosta, M., Budde, M., Magadzire, T., Shitote, C., Pound, J.,
Constantino, A., Nakalembe, C., Mwangi, K., Sobue, S., Newby, T., Whitcraft,
A., Jarvis, I., and Verdin, J.: Strengthening agricultural decisions in
countries at risk of food insecurity: The GEOGLAM Crop Monitor for Early
Warning, Remote Sens. Environ., 237, 111553,
<a href="https://doi.org/10.1016/j.rse.2019.111553" target="_blank">https://doi.org/10.1016/j.rse.2019.111553</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>Becker-Reshef et al.(2023)Becker-Reshef, Barker, Whitcraft, Oliva,
Mobley, Justice, and Sahajpal</label><mixed-citation>
      
Becker-Reshef, I., Barker, B., Whitcraft, A., Oliva, P., Mobley, K., Justice,
C., and Sahajpal, R.: Crop type maps for operational global agricultural
monitoring, Sci. Data, 10, 172, <a href="https://doi.org/10.1038/s41597-023-02047-9" target="_blank">https://doi.org/10.1038/s41597-023-02047-9</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>Benos et al.(2021)Benos, Tagarakis, Dolias, Berruto, Kateris, and
Bochtis</label><mixed-citation>
      
Benos, L., Tagarakis, A. C., Dolias, G., Berruto, R., Kateris, D., and Bochtis,
D.: Machine learning in agriculture: A comprehensive updated review, Sensors,
21, 3758, <a href="https://doi.org/10.3390/s21113758" target="_blank">https://doi.org/10.3390/s21113758</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>Boogaard et al.(2022)Boogaard, Schubert, De Wit, Lazebnik, Hutjes,
and Van der Grijn</label><mixed-citation>
      
Boogaard, H., Schubert, J., De Wit, A., Lazebnik, J., Hutjes, R., and Van der
Grijn, G.: Agrometeorological indicators from 1979 to present derived from
reanalysis, Climate Data Store – Copernicus Climate Change Service,
<a href="https://doi.org/10.24381/cds.6c68c9bb" target="_blank">https://doi.org/10.24381/cds.6c68c9bb</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>Boryan et al.(2011)Boryan, Yang, Mueller, and
Craig</label><mixed-citation>
      
Boryan, C., Yang, Z., Mueller, R., and Craig, M.: Monitoring US agriculture:
the US department of agriculture, national agricultural statistics service,
cropland data layer program, Geocarto Int., 26, 341–358, 2011.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>Brazil(2022)</label><mixed-citation>
      
Brazil: IBGE SIDRA. “Tabela 1612: Área plantada, área colhida, quantidade
produzida, rendimento médio e valor da produção das lavouras
temporárias”, <a href="https://sidra.ibge.gov.br/tabela/1612" target="_blank"/> (last access:
6 February 2024), 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>Burnell et al.(2023)Burnell, Schellaert, Burden, Ullman,
Martinez-Plumed, Tenenbaum, Rutar, Cheke, Sohl-Dickstein, Mitchell, Kiela,
Shanahan, Voorhees, Cohn, Leibo, and Hernandez-Orallo</label><mixed-citation>
      
Burnell, R., Schellaert, W., Burden, J., Ullman, T. D., Martinez-Plumed, F.,
Tenenbaum, J. B., Rutar, D., Cheke, L. G., Sohl-Dickstein, J., Mitchell, M.,
Kiela, D., Shanahan, M., Voorhees, E. M., Cohn, A. G., Leibo, J. Z., and
Hernandez-Orallo, J.: Rethink reporting of evaluation results in AI,
Science, 380, 136–138, <a href="https://doi.org/10.1126/science.adf6369" target="_blank">https://doi.org/10.1126/science.adf6369</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>Chen and Villoria(2022)</label><mixed-citation>
      
Chen, B. and Villoria, N. B.: Foreign yield shocks and domestic price
variability: the case of maize in developing countries, Environ.
Res. Lett., 17, 124044, <a href="https://doi.org/10.1088/1748-9326/aca7d5" target="_blank">https://doi.org/10.1088/1748-9326/aca7d5</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>China(2024)</label><mixed-citation>
      
China: National Bureau of Statistics of China, National Data Portal,
<a href="https://data.stats.gov.cn" target="_blank"/> (last access: 18 February 2024), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>Chlingaryan et al.(2018)Chlingaryan, Sukkarieh, and
Whelan</label><mixed-citation>
      
Chlingaryan, A., Sukkarieh, S., and Whelan, B.: Machine learning approaches for
crop yield prediction and nitrogen status estimation in precision
agriculture: A review, Comput. Electron. Agr., 151, 61–69,
<a href="https://doi.org/10.1016/j.compag.2018.05.012" target="_blank">https://doi.org/10.1016/j.compag.2018.05.012</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>Coulibaly et al.(2019)Coulibaly, Kamsu-Foguem, Kamissoko, and
Traore</label><mixed-citation>
      
Coulibaly, S., Kamsu-Foguem, B., Kamissoko, D., and Traore, D.: Deep neural
networks with transfer learning in millet crop images, Comput. Ind.,
108, 115–120, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>Cunha et al.(2018)Cunha, Silva, and Netto</label><mixed-citation>
      
Cunha, R. L., Silva, B., and Netto, M. A.: A scalable machine learning system  for pre-season agriculture yield forecast, in: 2018 IEEE 14th international  conference on e-science (e-Science), IEEE, 423–430, <a href="https://doi.org/10.1109/eScience.2018.00131" target="_blank">https://doi.org/10.1109/eScience.2018.00131</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>Darbyshire et al.(2020)Darbyshire, Crean, Cashen, Anwar, Broadfoot,
Simpson, Cobon, Pudmenzky, Kouadio, and Kodur</label><mixed-citation>
      
Darbyshire, R., Crean, J., Cashen, M., Anwar, M. R., Broadfoot, K. M., Simpson,
M., Cobon, D. H., Pudmenzky, C., Kouadio, L., and Kodur, S.: Insights into
the value of seasonal climate forecasts to agriculture, Aust. J. Agr. Resour. Ec., 64, 1034–1058,
<a href="https://doi.org/10.1111/1467-8489.12389" target="_blank">https://doi.org/10.1111/1467-8489.12389</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>Davis et al.(2025)</label><mixed-citation>
      
Davis, K. F., Anderson, W., Ehrmann, S., Flach, R., Meyer, C., Proctor, J.,  Ray, D. K., You, L., Foley, M., Kerdiles, H., Hultgren, A., Huybers, P., Kebede, E., Meroni, M., Park, C., and Lee, D.: HarvestStat: A global  effort towards open and standardized sub-national agricultural data,  Environ. Res. Lett., 20, 052001, <a href="https://doi.org/10.1088/1748-9326/adcb54" target="_blank">https://doi.org/10.1088/1748-9326/adcb54</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>Duden et al.(2024)Duden, Nacke, and Offermann</label><mixed-citation>
      
Duden, C., Nacke, C., and Offermann, F.: German yield and area data for 11
crops from 1979 to 2021 at a harmonized spatial resolution of 397 districts,
Sci. Data, 11, <a href="https://doi.org/10.1038/s41597-024-02951-8" target="_blank">https://doi.org/10.1038/s41597-024-02951-8</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>Dueben et al.(2022)Dueben, Schultz, Chantry, Gagne, Hall, and
McGovern</label><mixed-citation>
      
Dueben, P. D., Schultz, M. G., Chantry, M., Gagne, D. J., Hall, D. M., and
McGovern, A.: Challenges and Benchmark Datasets for Machine Learning
in the Atmospheric Sciences: Definition, Status, and Outlook,
Artificial Intelligence for the Earth Systems, 1,
<a href="https://doi.org/10.1175/AIES-D-21-0002.1" target="_blank">https://doi.org/10.1175/AIES-D-21-0002.1</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>EC-JRC(2024)</label><mixed-citation>
      
EC-JRC: Elaboration of Van Tricht et al. (2023), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>Ennaji et al.(2023)Ennaji, Vergutz, and El Allali</label><mixed-citation>
      
Ennaji, O., Vergutz, L., and El Allali, A.: Machine learning in nutrient
management: A review, Artificial Intelligence in Agriculture, 9, 1–11,
<a href="https://doi.org/10.1016/j.aiia.2023.06.001" target="_blank">https://doi.org/10.1016/j.aiia.2023.06.001</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>Ennaji et al.(2024)Ennaji, Baha, Vergutz, and
El Allali</label><mixed-citation>
      
Ennaji, O., Baha, S., Vergutz, L., and El Allali, A.: Gradient boosting for
yield prediction of elite maize hybrid ZhengDan 958, PLoS One, 19,
e0315493, <a href="https://doi.org/10.1371/journal.pone.0315493" target="_blank">https://doi.org/10.1371/journal.pone.0315493</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>Fan et al.(2022)Fan, Bai, Li, Ortiz-Bobea, and Gomes</label><mixed-citation>
      
Fan, J., Bai, J., Li, Z., Ortiz-Bobea, A., and Gomes, C.: A GNN-RNN Approach
for Harnessing Geospatial and Temporal Information: Application to Crop Yield
Prediction, Proceedings of the AAAI Conference on Artificial Intelligence,
36, 11873–11881, <a href="https://doi.org/10.1609/aaai.v36i11.21444" target="_blank">https://doi.org/10.1609/aaai.v36i11.21444</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>Fanzo(2024)</label><mixed-citation>
      
Fanzo, J.: Kicking around in the wreck, PLOS Climate, 3, e0000401,
<a href="https://doi.org/10.1371/journal.pclm.0000401" target="_blank">https://doi.org/10.1371/journal.pclm.0000401</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>FAO(2025)</label><mixed-citation>
      
FAO: Crop Calendar Food and Agriculture Organization of the United Nations,
<a href="https://cropcalendar.apps.fao.org" target="_blank"/> (last access: 11 February 2025), 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>Fernandez-Beltran et al.(2021)Fernandez-Beltran, Baidar, Kang, and
Pla</label><mixed-citation>
      
Fernandez-Beltran, R., Baidar, T., Kang, J., and Pla, F.: Rice-Yield
Prediction with Multi-Temporal Sentinel-2 Data and 3D CNN: A Case Study in
Nepal, Remote Sensing, 13, 1391, <a href="https://doi.org/10.3390/rs13071391" target="_blank">https://doi.org/10.3390/rs13071391</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>Franch et al.(2022)</label><mixed-citation>
      
Franch, B., Cintas, J., Becker-Reshef, I., Sanchez-Torres, M. J., Roger, J.,  Skakun, S., Sobrino, J. A., Van Tricht, K., Degerickx, J., Gilliams, S.,  Koetz, B., Szantoi, Z., and Whitcraft, A.: Global crop calendars of maize and wheat in the framework of the WorldCereal project, GISci. Remote Sens., 59, 885–913, <a href="https://doi.org/10.1080/15481603.2022.2079273" target="_blank">https://doi.org/10.1080/15481603.2022.2079273</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>Frieler et al.(2017)</label><mixed-citation>
      
Frieler, K., Schauberger, B., Arneth, A., Balkovič, J.,  Chryssanthacopoulos, J., Deryng, D., Elliott, J., Folberth, C., Khabarov, N.,  Müller, C., Olin, S., Pugh, T. A. M., Schaphoff, S., Schewe, J., Schmid, E., Warszawski, L., and Levermann, A.: Understanding the weather signal in national
crop-yield variability, Earth's Future, 5, 605–616,
<a href="https://doi.org/10.1002/2016EF000525" target="_blank">https://doi.org/10.1002/2016EF000525</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>Gavasso-Rita et al.(2023)Gavasso-Rita, Papalexiou, Li, Elshorbagy,
Li, and Schuster-Wallace</label><mixed-citation>
      
Gavasso-Rita, Y. L., Papalexiou, S. M., Li, Y., Elshorbagy, A., Li, Z., and
Schuster-Wallace, C.: Crop models and their use in assessing crop production
and food security: A review, Food and Energy Security, 13, e503,
<a href="https://doi.org/10.1002/fes3.503" target="_blank">https://doi.org/10.1002/fes3.503</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>Good and Irwin(2003)</label><mixed-citation>
      
Good, D. L. and Irwin, S. H.: Understanding USDA corn and soybean production  forecasts: An overview of methods, performance and market impacts, <a href="https://doi.org/10.22004/ag.econ.37496" target="_blank">https://doi.org/10.22004/ag.econ.37496</a>, 2003.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>Hatfield and Prueger(2015)</label><mixed-citation>
      
Hatfield, J. L. and Prueger, J. H.: Temperature extremes: Effect on plant
growth and development, Weather and Climate Extremes, 10, 4–10, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>He et al.(2017)He, Wang, Wang, and Robertson</label><mixed-citation>
      
He, D., Wang, E., Wang, J., and Robertson, M.: Data requirement for effective
calibration of process-based crop models, Agr. Forest
Meteorol., 234–235, 136–148, <a href="https://doi.org/10.1016/j.agrformet.2016.12.015" target="_blank">https://doi.org/10.1016/j.agrformet.2016.12.015</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>Hengl et al.(2017)</label><mixed-citation>
      
Hengl, T., Mendes de Jesus, J., Heuvelink, G. B., Ruiperez Gonzalez, M.,
Kilibarda, M., Blagotić, A., Shangguan, W., Wright, M. N., Geng, X.,
Bauer-Marschallinger, B., Guevara, M. A., Vargas, R., MacMillan, R. A.,
Batjes, N. H., Leenaars, J. G. B., Ribeiro, E., Wheeler, I., Mantel, S., and
Kempen, B.: SoilGrids250m: Global gridded soil information based on machine
learning, PLoS One, 12, e0169748, <a href="https://doi.org/10.1371/journal.pone.0169748" target="_blank">https://doi.org/10.1371/journal.pone.0169748</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>Hoffmann et al.(2016)</label><mixed-citation>
      
Hoffmann, H., Zhao, G., Asseng, S., Bindi, M., Biernath, C., Constantin, J.,  Coucheney, E., Dechow, R., Doro, L., Eckersten, H., Gaiser, T., Grosz, B., Heinlein, F., Kassie, B. T., Kersebaum, K.-C., Klein, C., Kuhnert, M., Lewan, E., Moriondo, M., Nendel, C., Priesack, E., Raynal, H., Roggero, P. P., Rötter, R. P., Siebert, S., Specka, X., Tao, F., Teixeira, E., Trombi, G., Wallach, D., Weihermüller, L., Yeluripati, J., and Ewert, F.: Impact of spatial soil and climate input data aggregation on regional yield simulations, PLoS One, 11, e0151782, <a href="https://doi.org/10.1371/journal.pone.0151782" target="_blank">https://doi.org/10.1371/journal.pone.0151782</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>Höhl et al.(2023)Höhl, Ofori-Ampofo, Obadic,
Fernández-Torres, Salih Kuzu, and Zhu</label><mixed-citation>
      
Höhl, A., Ofori-Ampofo, S., Obadic, I., Fernández-Torres, M.-Á., Salih Kuzu, R., and Zhu, X.: USCC: A Benchmark Dataset for Crop Yield Prediction under Climate Extremes, EGU General Assembly 2023, Vienna, Austria, 23–28 Apr 2023, EGU23-15540, <a href="https://doi.org/10.5194/egusphere-egu23-15540" target="_blank">https://doi.org/10.5194/egusphere-egu23-15540</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>Huete et al.(2002)Huete, Didan, Miura, Rodriguez, Gao, and
Ferreira</label><mixed-citation>
      
Huete, A., Didan, K., Miura, T., Rodriguez, E. P., Gao, X., and Ferreira,
L. G.: Overview of the radiometric and biophysical performance of the MODIS
vegetation indices, Remote Sens. Environ., 83, 195–213, 2002.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>ICRISAT Mali(2018)</label><mixed-citation>
      
ICRISAT Mali: Compagnie Malienne pour le Developpement des Textiles (CMDT)  Monitoring Operational Maize Yield Statistics, <a href="http://data.icrisat.org/dataverse/" target="_blank"/> (last access: 30 May 2026), 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>India(2024)</label><mixed-citation>
      
India: ICRISAT. District Level Database,
<a href="http://data.icrisat.org/dld/src/crops.html" target="_blank"/> (last access:  9 February 2024), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>Johnson(2016)</label><mixed-citation>
      
Johnson, D. M.: A comprehensive assessment of the correlations between field
crop yields and commonly used MODIS products, Int. J.
Appl. Earth Obs., 52, 65–81,
<a href="https://doi.org/10.1016/j.jag.2016.05.010" target="_blank">https://doi.org/10.1016/j.jag.2016.05.010</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>Kallenberg et al.(2025)</label><mixed-citation>
      
Kallenberg, M., Paudel, D., Ofori-Ampofo, S., Baja, H., van Bree, R., Potze,  A., Poudel, P., Saleh, A., Anderson, W., von Bloh, M., Castellano, A.,  Ennaji, O., Hamed, R., Laudien, R., Lee, D., Luna, I., Masiliūnas, D.,  Meroni, M., Mutuku, J. M., Mkuhlani, S., Richetti, J., Ruane, A. C.,  Sahajpal, R., Shuai, G., Sitokonstantinou, V., de Souza Noia Junior, R.,  Srivastava, A. K., Strong, R., Sweet, L.-b., Vojnović, P., de Wit, A.,  Zachow, M., and Athanasiadis, I. N.: CY-Bench: A comprehensive benchmark  dataset for subnational crop yield forecasting, Zenodo [data set],  <a href="https://doi.org/10.5281/zenodo.11502142" target="_blank">https://doi.org/10.5281/zenodo.11502142</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>Kallenberg et al.(2026)</label><mixed-citation>
      
Kallenberg, M., Paudel, D., Ofori-Ampofo, S., Baja, H., van Bree, R., Potze, A., Poudel, P., Saleh, A., Anderson, W., von Bloh, M., Castellano, A., Ennaji, O., Hamed, R., Laudien, R., Lee, D., Luna, I., Masiliunas, D., Meroni, M., Mutuku, J. M., Mkuhlani, S., Richetti, J., Ruane, A. C., Sahajpal, R., Shuai, G., Sitokonstantinou, V., de Souza Noia Junior, R., Srivastava, A. K., Strong, R., Sweet, L.-b., Vojnovic, P., de Wit, A., Zachow, M., and Athanasiadis, I. N.: WUR-AI/AgMLCY-Bench: CY-Bench v1.0.0: ESSD paper, Zenodo [code], <a href="https://doi.org/10.5281/zenodo.20456375" target="_blank">https://doi.org/10.5281/zenodo.20456375</a>, 2026.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>Kamilaris and
Prenafeta-Boldú(2018)</label><mixed-citation>
      
Kamilaris, A. and Prenafeta-Boldú, F. X.: Deep learning in agriculture: A
survey, Comput. Electron. Agr., 147, 70–90,
<a href="https://doi.org/10.1016/j.compag.2018.02.016" target="_blank">https://doi.org/10.1016/j.compag.2018.02.016</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>Kapoor and Narayanan(2023)</label><mixed-citation>
      
Kapoor, S. and Narayanan, A.: Leakage and the reproducibility crisis in
machine-learning-based science, Patterns, 4, 100804,
<a href="https://doi.org/10.1016/j.patter.2023.100804" target="_blank">https://doi.org/10.1016/j.patter.2023.100804</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>Kebede et al.(2025)Kebede, Oluoch, Siebert, Mehta, Hartman,
Jägermeyr, Ray, Ali, Brauman, Deng et al.</label><mixed-citation>
      
Kebede, E. A., Oluoch, K. O., Siebert, S., Mehta, P., Hartman, S.,  Jägermeyr, J., Ray, D., Ali, T., Brauman, K. A., Deng, Q., Xie, W., and Davis, K. F.: A global open-source dataset of monthly irrigated and rainfed cropped areas (MIRCA-OS) for the 21st century, Sci. Data, 12, 208, <a href="https://doi.org/10.1038/s41597-024-04313-w" target="_blank">https://doi.org/10.1038/s41597-024-04313-w</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>Kerner et al.(2020)Kerner, Tseng, Becker-Reshef, Nakalembe, Barker,
Munshell, Paliyam, and Hosseini</label><mixed-citation>
      
Kerner, H., Tseng, G., Becker-Reshef, I., Nakalembe, C., Barker, B., Munshell,
B., Paliyam, M., and Hosseini, M.: Rapid Response Crop Maps in Data Sparse
Regions, in: ACM SIGKDD Conference on Data Mining and Knowledge Discovery
Workshops, arXiv, <a href="https://doi.org/10.48550/arXiv.2006.16866" target="_blank">https://doi.org/10.48550/arXiv.2006.16866</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>Khaki et al.(2020)Khaki, Wang, and Archontoulis</label><mixed-citation>
      
Khaki, S., Wang, L., and Archontoulis, S. V.: A CNN-RNN framework for crop
yield prediction, Front. Plant Sci., 10, 1750,
<a href="https://doi.org/10.3389/fpls.2019.01750" target="_blank">https://doi.org/10.3389/fpls.2019.01750</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>Kondmann et al.(2021)Kondmann, Toker, Rußwurm, Camero, Peressuti,
Milcinski, Mathieu, Longepe, Davis, Marchisio, Leal-Taixé, and
Zhu</label><mixed-citation>
      
Kondmann, L., Toker, A., Rußwurm, M., Camero, A., Peressuti, D., Milcinski, G., Mathieu, P.-P., Longepe, N., Davis, T., Marchisio, G., Leal-Taixé, L., and Zhu, X.: DENETHOR: The DynamicEarthNET dataset for Harmonized, inter-Operable, analysis-Ready, daily crop monitoring from space, in: Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks, edited by: Vanschoren, J. and Yeung, S., Vol. 1, Curran, <a href="https://openreview.net/pdf?id=uUa4jNMLjrL" target="_blank"/> (last access: 30 May 2026), 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>Koukos et al.(2024)</label><mixed-citation>
      
Koukos, A., Jo, H.-W., Sitokonstantinou, V., Tsoumas, I., Kontoes, C., and Lee, W.-K.: Towards Global Crop Maps with Transfer Learning, in: IGARSS 2024–2024 IEEE International Geoscience and Remote Sensing Symposium, 1540–1545, IEEE, <a href="https://doi.org/10.1109/IGARSS53475.2024.10641793" target="_blank">https://doi.org/10.1109/IGARSS53475.2024.10641793</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>Lawes et al.(2022)Lawes, Mata, Richetti, Fletcher, and
Herrmann</label><mixed-citation>
      
Lawes, R., Mata, G., Richetti, J., Fletcher, A., and Herrmann, C.: Using remote
sensing, process-based crop models, and machine learning to evaluate crop
rotations across 20 million hectares in Western Australia, Agron.
Sustain. Dev., 42, 120, <a href="https://doi.org/10.1007/s13593-022-00851-y" target="_blank">https://doi.org/10.1007/s13593-022-00851-y</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>Lecerf et al.(2019)Lecerf, Ceglar, López-Lozano, Van Der Velde,
and Baruth</label><mixed-citation>
      
Lecerf, R., Ceglar, A., López-Lozano, R., Van Der Velde, M., and Baruth,
B.: Assessing the information in crop model and meteorological indicators to
forecast crop yield over Europe, Agr. Syst., 168, 191–202,
<a href="https://doi.org/10.1016/j.agsy.2018.03.002" target="_blank">https://doi.org/10.1016/j.agsy.2018.03.002</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>Lee et al.(2022)Lee, Davenport, Shukla, Husak, Funk, Harrison,
McNally, Rowland, Budde, and Verdin</label><mixed-citation>
      
Lee, D., Davenport, F., Shukla, S., Husak, G., Funk, C., Harrison, L., McNally,
A., Rowland, J., Budde, M., and Verdin, J.: Maize yield forecasts for
Sub-Saharan Africa using Earth Observation data and machine learning, Glob. Food Secur., 33, 100643, <a href="https://doi.org/10.1016/j.gfs.2022.100643" target="_blank">https://doi.org/10.1016/j.gfs.2022.100643</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>Lee et al.(2025)</label><mixed-citation>
      
Lee, D., Anderson, W., Chen, X., Davenport, F., Shukla, S., Sahajpal, R.,  Budde, M., Rowland, J., Verdin, J., You, L., Ahouangbenon, M., Davis, K. F., Kebede, E., Ehrmann, S., Justice, C., and Meyer, C.: HarvestStat  Africa–harmonized subnational crop statistics for sub-Saharan Africa, Sci. Data, 12, 690, <a href="https://doi.org/10.1038/s41597-025-05001-z" target="_blank">https://doi.org/10.1038/s41597-025-05001-z</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>Lesk et al.(2022)Lesk, Anderson, Rigden, Coast, Jägermeyr, McDermid,
Davis, and Konar</label><mixed-citation>
      
Lesk, C., Anderson, W., Rigden, A., Coast, O., Jägermeyr, J., McDermid, S.,
Davis, K. F., and Konar, M.: Compound heat and moisture extreme impacts on
global crop yields under climate change, Nat. Rev. Earth  Environ.,
3, 872–889, <a href="https://doi.org/10.1038/s43017-022-00368-8" target="_blank">https://doi.org/10.1038/s43017-022-00368-8</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>Liakos et al.(2018)Liakos, Busato, Moshou, Pearson, and
Bochtis</label><mixed-citation>
      
Liakos, K., Busato, P., Moshou, D., Pearson, S., and Bochtis, D.: Machine
learning in agriculture: A review, Sensors, 18, 2674,
<a href="https://doi.org/10.3390/s18082674" target="_blank">https://doi.org/10.3390/s18082674</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>Liliane and Charles(2020)</label><mixed-citation>
      
Liliane, T. N. and Charles, M. S.: Factors Affecting Yield of Crops, in:
Agronomy, edited by: Amanullah, Chap. 2, IntechOpen, Rijeka,
<a href="https://doi.org/10.5772/intechopen.90672" target="_blank">https://doi.org/10.5772/intechopen.90672</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>Lin et al.(2024)Lin, Guillot, Crawford, Zhang, Yuan, and
Tzeng</label><mixed-citation>
      
Lin, F., Guillot, K., Crawford, S., Zhang, Y., Yuan, X., and Tzeng, N.-F.: An
Open and Large-Scale Dataset for Multi-Modal Climate Change-aware Crop Yield
Predictions, in: Proceedings of the 30th ACM SIGKDD Conference on Knowledge
Discovery and Data Mining,  5375–5386, ACM,
<a href="https://doi.org/10.1145/3637528.3671536" target="_blank">https://doi.org/10.1145/3637528.3671536</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>Liu et al.(2022)Liu, Yang, Mohammadi, Song, Bi, and
Wang</label><mixed-citation>
      
Liu, Q., Yang, M., Mohammadi, K., Song, D., Bi, J., and Wang, G.: Machine
Learning Crop Yield Models Based on Meteorological Features and
Comparison with a Process-Based Model, Artificial Intelligence for
the Earth Systems, 1, <a href="https://doi.org/10.1175/AIES-D-22-0002.1" target="_blank">https://doi.org/10.1175/AIES-D-22-0002.1</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>López et al.(2021)López, Way, and Sadok</label><mixed-citation>
      
López, J., Way, D. A., and Sadok, W.: Systemic effects of rising
atmospheric vapor pressure deficit on plant physiology and productivity,
Glob. Change Biol., 27, 1704–1720, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>Ma et al.(2023)Ma, Yang, Huang, and Zhang</label><mixed-citation>
      
Ma, Y., Yang, Z., Huang, Q., and Zhang, Z.: Improving the Transferability of
Deep Learning Models for Crop Yield Prediction: A Partial
Domain Adaptation Approach, Remote Sens., 15,
<a href="https://doi.org/10.3390/rs15184562" target="_blank">https://doi.org/10.3390/rs15184562</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>Mateo-Sanchis et al.(2021)Mateo-Sanchis, Piles, Amorós-López,
Muñoz-Marí, Adsuara, Moreno-Martínez, and
Camps-Valls</label><mixed-citation>
      
Mateo-Sanchis, A., Piles, M., Amorós-López, J., Muñoz-Marí,
J., Adsuara, J. E., Moreno-Martínez, Á., and Camps-Valls, G.:
Learning main drivers of crop progress and failure in Europe with
interpretable machine learning, Int. J. Appl. Earth
Obs., 104, 102574,
<a href="https://doi.org/10.1016/j.jag.2021.102574" target="_blank">https://doi.org/10.1016/j.jag.2021.102574</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>Mehrabi et al.(2022)Mehrabi, Delzeit, Ignaciuk, Levers, Braich,
Bajaj, Amo-Aidoo, Anderson, Balgah, Benton, Chari, Ellis, Gahi, Gaupp,
Garibaldi, Gerber, Godde, Grass, Heimann, Hirons, Hoogenboom, Jain, James,
Makowski, Masamha, Meng, Monprapussorn, Müller, Nelson, Newlands, Noack,
Oronje, Raymond, Reichstein, Rieseberg, Rodriguez-Llanes, Rosenstock,
Rowhani, Sarhadi, Seppelt, Sidhu, Snapp, Soma, Sparks, Teh, Tigchelaar,
Vogel, West, Wittman, and You</label><mixed-citation>
      
Mehrabi, Z., Delzeit, R., Ignaciuk, A., Levers, C., Braich, G., Bajaj, K.,
Amo-Aidoo, A., Anderson, W., Balgah, R. A., Benton, T. G., Chari, M. M.,
Ellis, E. C., Gahi, N. Z., Gaupp, F., Garibaldi, L. A., Gerber, J. S., Godde,
C. M., Grass, I., Heimann, T., Hirons, M., Hoogenboom, G., Jain, M., James,
D., Makowski, D., Masamha, B., Meng, S., Monprapussorn, S., Müller, D.,
Nelson, A., Newlands, N. K., Noack, F., Oronje, M., Raymond, C., Reichstein,
M., Rieseberg, L. H., Rodriguez-Llanes, J. M., Rosenstock, T., Rowhani, P.,
Sarhadi, A., Seppelt, R., Sidhu, B. S., Snapp, S., Soma, T., Sparks, A. H.,
Teh, L., Tigchelaar, M., Vogel, M. M., West, P. C., Wittman, H., and You, L.:
Research priorities for global food security under extreme events, One Earth,
5, 756–766, <a href="https://doi.org/10.1016/j.oneear.2022.06.008" target="_blank">https://doi.org/10.1016/j.oneear.2022.06.008</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>Meroni et al.(2019)Meroni, Fasbender, Rembold, Atzberger, and
Klisch</label><mixed-citation>
      
Meroni, M., Fasbender, D., Rembold, F., Atzberger, C., and Klisch, A.: Near
real-time vegetation anomaly detection with MODIS NDVI: Timeliness vs.
accuracy and effect of anomaly computation options, Remote Sens.
Environ., 221, 508–521, <a href="https://doi.org/10.1016/j.rse.2018.11.041" target="_blank">https://doi.org/10.1016/j.rse.2018.11.041</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib65"><label>Meroni et al.(2021)Meroni, Waldner, Seguini, Kerdiles, and
Rembold</label><mixed-citation>
      
Meroni, M., Waldner, F., Seguini, L., Kerdiles, H., and Rembold, F.: Yield
forecasting with machine learning and small data: What gains for grains?,
Agr. Forest Meteorol., 308, 108555,
<a href="https://doi.org/10.1016/j.agrformet.2021.108555" target="_blank">https://doi.org/10.1016/j.agrformet.2021.108555</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib66"><label>Mexico(2019)</label><mixed-citation>
      
Mexico: INEGI. Agricultural Census and Survey Data,
<a href="https://www.inegi.org.mx" target="_blank">https://www.inegi.org.mx</a> (last access: 10 April 2024), 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib67"><label>Meyer and Pebesma(2022)</label><mixed-citation>
      
Meyer, H. and Pebesma, E.: Machine learning-based global maps of ecological
variables and the challenge of assessing them, Nat. Commun., 13,
2208, <a href="https://doi.org/10.1038/s41467-022-29838-9" target="_blank">https://doi.org/10.1038/s41467-022-29838-9</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib68"><label>Minoli et al.(2019)Minoli, Egli, Rolinski, and
Müller</label><mixed-citation>
      
Minoli, S., Egli, D. B., Rolinski, S., and Müller, C.: Modelling cropping
periods of grain crops at the global scale, Global Planet. Change, 174,
35–46, <a href="https://doi.org/10.1016/j.gloplacha.2018.12.013" target="_blank">https://doi.org/10.1016/j.gloplacha.2018.12.013</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib69"><label>Miralles et al.(2025)</label><mixed-citation>
      
Miralles, D. G., Bonte, O., Koppa, A., Baez-Villanueva, O. M., Tronquo, E.,  Zhong, F., Beck, H. E., Hulsman, P., Dorigo, W., Verhoest, N. E., and Haghdoost, S.: GLEAM4: global land evaporation and soil moisture dataset at 0.1° resolution from 1980 to near present, Sci. Data, 12, 416, <a href="https://doi.org/10.1038/s41597-025-04610-y" target="_blank">https://doi.org/10.1038/s41597-025-04610-y</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib70"><label>Mitrovic et al.(2020)Mitrovic, McWilliams, Walker, Buesing, and
Blundell</label><mixed-citation>
      
Mitrovic, J., McWilliams, B., Walker, J., Buesing, L., and Blundell, C.:
Representation learning via invariant causal mechanisms, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.2010.07922" target="_blank">https://doi.org/10.48550/arXiv.2010.07922</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib71"><label>Nakalembe and Kerner(2023)</label><mixed-citation>
      
Nakalembe, C. and Kerner, H.: Considerations for AI-EO for agriculture in
Sub-Saharan Africa, Environ. Res. Lett., 18, 041002,
<a href="https://doi.org/10.1088/1748-9326/acc476" target="_blank">https://doi.org/10.1088/1748-9326/acc476</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib72"><label>Neophytides et al.(2024)</label><mixed-citation>
      
Neophytides, S. P., Tsoumas, I., Tsalakou, A., Christoforou, M.,  Mavrovouniotis, M., Eliades, M., Papoutsa, C., Kontoes, C., and Hadjimitsis,  D. G.: Invariant learning as a pathway to robust potato yield prediction, in:  Remote Sensing for Agriculture, Ecosystems, and Hydrology XXVI, SPIE, 13191, 33–42, <a href="https://doi.org/10.1117/12.3031554" target="_blank">https://doi.org/10.1117/12.3031554</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib73"><label>Nowakowski et al.(2021)Nowakowski, Mrziglod, Spiller, Bonifacio,
Ferrari, Mathieu, Garcia-Herranz, and Kim</label><mixed-citation>
      
Nowakowski, A., Mrziglod, J., Spiller, D., Bonifacio, R., Ferrari, I., Mathieu, P. P., Garcia-Herranz, M., and Kim, D.-H.: Crop type mapping by using transfer learning, Int. J. Appl. Earth Obs., 98, 102313, <a href="https://doi.org/10.1016/j.jag.2021.102313" target="_blank">https://doi.org/10.1016/j.jag.2021.102313</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib74"><label>Oikonomidis et al.(2022)Oikonomidis, Catal, and
Kassahun</label><mixed-citation>
      
Oikonomidis, A., Catal, C., and Kassahun, A.: Deep learning for crop yield
prediction: a systematic literature review, New Zeal. J. Crop
Hort.,  1–26, <a href="https://doi.org/10.1080/01140671.2022.2032213" target="_blank">https://doi.org/10.1080/01140671.2022.2032213</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib75"><label>Paudel et al.(2021)Paudel, Boogaard, de Wit, Janssen, Osinga,
Pylianidis, and Athanasiadis</label><mixed-citation>
      
Paudel, D., Boogaard, H., de Wit, A., Janssen, S., Osinga, S., Pylianidis, C.,
and Athanasiadis, I. N.: Machine learning for large-scale crop yield
forecasting, Agr. Syst., 187, 103016,
<a href="https://doi.org/10.1016/j.agsy.2020.103016" target="_blank">https://doi.org/10.1016/j.agsy.2020.103016</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib76"><label>Paudel et al.(2022)Paudel, Boogaard, de Wit, van der Velde, Claverie,
Nisini, Janssen, Osinga, and Athanasiadis</label><mixed-citation>
      
Paudel, D., Boogaard, H., de Wit, A., van der Velde, M., Claverie, M., Nisini,
L., Janssen, S., Osinga, S., and Athanasiadis, I. N.: Machine learning for
regional crop yield forecasting in Europe, Field Crop. Res., 276,
108377, <a href="https://doi.org/10.1016/j.fcr.2021.108377" target="_blank">https://doi.org/10.1016/j.fcr.2021.108377</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib77"><label>Paudel et al.(2023)Paudel, Marcos, de Wit, Boogaard, and
Athanasiadis</label><mixed-citation>
      
Paudel, D., Marcos, D., de Wit, A., Boogaard, H., and Athanasiadis, I. N.: A
weakly supervised framework for high-resolution crop yield forecasts,
Environ. Res. Lett., 18, 094062, <a href="https://doi.org/10.1088/1748-9326/acf50e" target="_blank">https://doi.org/10.1088/1748-9326/acf50e</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib78"><label>Paudel et al.(2023b)Paudel, Marcos, de Wit, Boogaard, and
Athanasiadis</label><mixed-citation>
      
Paudel, D. R., Marcos, D., de Wit, A., Boogaard, H., and Athanasiadis, I. N.: A
weakly supervised framework for high resolution crop yield forecasts,
Environ. Res. Lett., 18, 094062, <a href="https://doi.org/10.1088/1748-9326/acf50e" target="_blank">https://doi.org/10.1088/1748-9326/acf50e</a>,
2023b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib79"><label>Pelletier et al.(2019)Pelletier, Webb, and
Petitjean</label><mixed-citation>
      
Pelletier, C., Webb, G. I., and Petitjean, F.: Temporal Convolutional Neural
Network for the Classification of Satellite Image Time Series, Remote
Sens., 11, <a href="https://doi.org/10.3390/rs11050523" target="_blank">https://doi.org/10.3390/rs11050523</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib80"><label>Poggio et al.(2021)Poggio, De Sousa, Batjes, Heuvelink, Kempen,
Ribeiro, and Rossiter</label><mixed-citation>
      
Poggio, L., de Sousa, L. M., Batjes, N. H., Heuvelink, G. B. M., Kempen, B., Ribeiro, E., and Rossiter, D.: SoilGrids 2.0: producing soil information for the globe with quantified spatial uncertainty, SOIL, 7, 217–240, <a href="https://doi.org/10.5194/soil-7-217-2021" target="_blank">https://doi.org/10.5194/soil-7-217-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib81"><label>Portmann et al.(2010)Portmann, Siebert, and
Döll</label><mixed-citation>
      
Portmann, F. T., Siebert, S., and Döll, P.: MIRCA2000 – Global monthly
irrigated and rainfed crop areas around the year 2000: A new high-resolution
data set for agricultural and hydrological modeling, Global Biogeochem.
Cy., 24, <a href="https://doi.org/10.1029/2008GB003435" target="_blank">https://doi.org/10.1029/2008GB003435</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib82"><label>Potter(2019)</label><mixed-citation>
      
Potter, N. A.: rnassqs: An “R” package to access agricultural data via the USDA National Agricultural Statistics Service (USDA-NASS) “Quick Stats” API, Journal of Open Source Software, 4, 1880, <a href="https://doi.org/10.21105/joss.01880" target="_blank">https://doi.org/10.21105/joss.01880</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib83"><label>Priyatikanto et al.(2023)Priyatikanto, Lu, Dash, and
Sheffield</label><mixed-citation>
      
Priyatikanto, R., Lu, Y., Dash, J., and Sheffield, J.: Improving
generalisability and transferability of machine-learning-based maize yield
prediction model through domain adaptation, Agr. Forest
Meteorol., 341, 109652, <a href="https://doi.org/10.1016/j.agrformet.2023.109652" target="_blank">https://doi.org/10.1016/j.agrformet.2023.109652</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib84"><label>Pushkarna et al.(2022)Pushkarna, Zaldivar, and
Kjartansson</label><mixed-citation>
      
Pushkarna, M., Zaldivar, A., and Kjartansson, O.: Data Cards: Purposeful and
transparent dataset documentation for responsible AI, in: Proceedings of the
2022 ACM Conference on Fairness, Accountability, and Transparency,
1776–1826, <a href="https://doi.org/10.1145/3531146.3533231" target="_blank">https://doi.org/10.1145/3531146.3533231</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib85"><label>Richards et al.(2023)Richards, Kirichenko, Bouchacourt, and
Ibrahim</label><mixed-citation>
      
Richards, M., Kirichenko, P., Bouchacourt, D., and Ibrahim, M.: Does Progress
On Object Recognition Benchmarks Improve Real-World
Generalization?, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2307.13136" target="_blank">https://doi.org/10.48550/arXiv.2307.13136</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib86"><label>Richetti et al.(2023)Richetti, Diakogianis, Bender, Colaço, and
Lawes</label><mixed-citation>
      
Richetti, J., Diakogianis, F. I., Bender, A., Colaço, A. F., and Lawes,
R. A.: A methods guideline for deep learning for tabular data in agriculture
with a case study to forecast cereal yield, Comput. Electron.
Agr., 205, 107642, <a href="https://doi.org/10.1016/j.compag.2023.107642" target="_blank">https://doi.org/10.1016/j.compag.2023.107642</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib87"><label>Rodell et al.(2004)Rodell, Houser, Jambor, Gottschalck, Mitchell,
Meng, Arsenault, Cosgrove, Radakovich, Bosilovich et al.</label><mixed-citation>
      
Rodell, M., Houser, P., Jambor, U., Gottschalck, J., Mitchell, K., Meng, C.-J., Arsenault, K., Cosgrove, B., Radakovich, J., Bosilovich, M., Entin, J. K., Walker, J. P., Lohmann, D., and Toll, D.: The global land data assimilation system, B. Am. Meteorol. Soc., 85, 381–394, <a href="https://doi.org/10.1175/BAMS-85-3-381" target="_blank">https://doi.org/10.1175/BAMS-85-3-381</a>, 2004.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib88"><label>Rolnick et al.(2024)Rolnick, Aspuru-Guzik, Beery, Dilkina, Donti,
Ghassemi, Kerner, Monteleoni, Rolf, Tambe, and White</label><mixed-citation>
      
Rolnick, D., Aspuru-Guzik, A., Beery, S., Dilkina, B., Donti, P. L., Ghassemi,
M., Kerner, H., Monteleoni, C., Rolf, E., Tambe, M., and White, A.:
Application-Driven Innovation in Machine Learning, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.2403.17381" target="_blank">https://doi.org/10.48550/arXiv.2403.17381</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib89"><label>Ronchetti et al.(2024)Ronchetti, Nisini Scacchiafichi, Seguini,
Cerrani, and van der Velde</label><mixed-citation>
      
Ronchetti, G., Nisini Scacchiafichi, L., Seguini, L., Cerrani, I., and van der Velde, M.: Harmonized European Union subnational crop statistics can reveal climate impacts and crop cultivation shifts, Earth Syst. Sci. Data, 16, 1623–1649, <a href="https://doi.org/10.5194/essd-16-1623-2024" target="_blank">https://doi.org/10.5194/essd-16-1623-2024</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib90"><label>Rußwurm et al.(2019)Rußwurm, Lefèvre, and
Körner</label><mixed-citation>
      
Rußwurm, M., Lefèvre, S., and Körner, M.: BreizhCrops: A Satellite
Time Series Dataset for Crop Type Identification, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.1905.11893" target="_blank">https://doi.org/10.48550/arXiv.1905.11893</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib91"><label>Rußwurm and Körner(2018)</label><mixed-citation>
      
Rußwurm, M. and Körner, M.: Multi-Temporal Land Cover Classification with
Sequential Recurrent Encoders, ISPRS Int. J. Geo-Inf., 7, <a href="https://doi.org/10.3390/ijgi7040129" target="_blank">https://doi.org/10.3390/ijgi7040129</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib92"><label>Sacks et al.(2010)Sacks, Deryng, Foley, and
Ramankutty</label><mixed-citation>
      
Sacks, W. J., Deryng, D., Foley, J. A., and Ramankutty, N.: Crop planting
dates: an analysis of global patterns, Global Ecol. Biogeogr., 19,
607–620, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib93"><label>Sainte Fare Garnot et al.(2020)Sainte Fare Garnot, Landrieu,
Giordano, and Chehata</label><mixed-citation>
      
Sainte Fare Garnot, V., Landrieu, L., Giordano, S., and Chehata, N.: Satellite
Image Time Series Classification with Pixel-Set Encoders and Temporal
Self-Attention, CVPR, <a href="https://doi.org/10.1109/CVPR42600.2020.01234" target="_blank">https://doi.org/10.1109/CVPR42600.2020.01234</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib94"><label>Schauberger et al.(2020)Schauberger, Jägermeyr, and
Gornott</label><mixed-citation>
      
Schauberger, B., Jägermeyr, J., and Gornott, C.: A systematic review of
local to regional yield forecasting approaches and frequently used data
resources, Eur. J. Agron., 120, 126153,
<a href="https://doi.org/10.1016/j.eja.2020.126153" target="_blank">https://doi.org/10.1016/j.eja.2020.126153</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib95"><label>Schlenker and Roberts(2009)</label><mixed-citation>
      
Schlenker, W. and Roberts, M. J.: Nonlinear temperature effects indicate severe
damages to U.S. crop yields under climate change, P.
Natl. Acad. Sci., 106, 15594–15598,
<a href="https://doi.org/10.1073/pnas.0906865106" target="_blank">https://doi.org/10.1073/pnas.0906865106</a>, 2009.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib96"><label>Schneider et al.(2023a)</label><mixed-citation>
      
Schneider, K. R., Fanzo, J., Haddad, L., Herrero, M., Moncayo, J. R., Herforth, A., Remans, R., Guarin, A., Resnick, D., Covic, N., Béné, C., Cattaneo, A., Aburto, N., Ambikapathi, R., Aytekin, D., Barquera, S., Battersby, J., Beal, T., Molina, P. B., Cafiero, C., Campeau, C., Caron, P., Conforti, P., Damerau, K., Di Girolamo, M., DeClerck, F., Dewi, D., Elouafi, I., Fabi, C., Foley, P., Frazier, T. J., Gephart, J., Golden, C., Fischer, C. G., Hendriks, S., Honorati, M., Huang, J., Kennedy, G., Laar, A., Lal, R., Lidder, P., Loken, B., Marshall, Q., Masuda, Y. J., McLaren, R., Miachon, L., Muñoz, H., Nordhagen, S., Qayyum, N., Saisana, M., Suhardiman, D., Sumaila, U. R., Cullen, M. T., Tubiello, F. N., Vivero-Pol, J.-L., Webb, P., and Wiebe, K.: The state of food systems worldwide in the countdown to 2030, Nature Food, 4, 1090–1110, <a href="https://doi.org/10.1038/s43016-023-00885-9" target="_blank">https://doi.org/10.1038/s43016-023-00885-9</a>, 2023a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib97"><label>Schneider et al.(2023b)Schneider, Schelte, Schmitz
et al.</label><mixed-citation>
      
Schneider, M., Schelte, T., Schmitz, F., and Körner, M.: EuroCrops: The Largest Harmonized Open Crop Dataset Across the European Union, Sci. Data, 10, 612, <a href="https://doi.org/10.1038/s41597-023-02517-0" target="_blank">https://doi.org/10.1038/s41597-023-02517-0</a>, 2023b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib98"><label>Seguini et al.(2026)Seguini, Klisch, Meroni, Vrieling, Manfron,
Atzberger, and Rembold</label><mixed-citation>
      
Seguini, L., Klisch, A., Meroni, M., Vrieling, A., Manfron, G., Atzberger, C., and Rembold, F.: Global near real-time 500&thinsp;m 10&thinsp;d FPAR dataset from MODIS and VIIRS for operational agricultural monitoring and crop yield forecasting, Earth Syst. Sci. Data, 18, 309–331, <a href="https://doi.org/10.5194/essd-18-309-2026" target="_blank">https://doi.org/10.5194/essd-18-309-2026</a>, 2026.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib99"><label>Seidel et al.(2018)Seidel, Palosuo, Thorburn, and
Wallach</label><mixed-citation>
      
Seidel, S., Palosuo, T., Thorburn, P., and Wallach, D.: Towards improved
calibration of crop models – Where are we now and where should we go?,
Eur. J. Agron., 94, 25–35,
<a href="https://doi.org/10.1016/j.eja.2018.01.006" target="_blank">https://doi.org/10.1016/j.eja.2018.01.006</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib100"><label>Singh et al.(2022)</label><mixed-citation>
      
Singh, K., Singh, D., Goroshi, S., Yashu, S., Kumar, Y., Solanki, S., and  Sagar, S.: Crop Yield forecasting under FASAL (Forecasting Agricultural  output using Space Agrometeorology and Land based observations), Tech. rep., India Meteorological Department (IMD), Ministry of Earth Sciences (MoES), Government of India, <a href="https://doi.org/10.13140/RG.2.2.11593.42083" target="_blank">https://doi.org/10.13140/RG.2.2.11593.42083</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib101"><label>Stuart et al.(2024)Stuart, Hobbins, Niebuhr, Ruane, Pulwarty, Hoell,
Thiaw, Rosenzweig, Muñoz-Arriola, Jahn et al.</label><mixed-citation>
      
Stuart, L., Hobbins, M., Niebuhr, E., Ruane, A. C., Pulwarty, R., Hoell, A.,  Thiaw, W., Rosenzweig, C., Muñoz-Arriola, F., Jahn, M., and Farrar, M.: Enhancing Global Food Security: Opportunities for the American  Meteorological Society, B. Am. Meteorol. Soc., 104, E760–E777, <a href="https://doi.org/10.1175/BAMS-D-22-0106.1" target="_blank">https://doi.org/10.1175/BAMS-D-22-0106.1</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib102"><label>Sweet et al.(2023)Sweet, Müller, Anand, and
Zscheischler</label><mixed-citation>
      
Sweet, L.-b., Müller, C., Anand, M., and Zscheischler, J.: Cross-Validation
Strategy Impacts the Performance and Interpretation of Machine
Learning Models, Artificial Intelligence for the Earth Systems, 2,
<a href="https://doi.org/10.1175/AIES-D-23-0026.1" target="_blank">https://doi.org/10.1175/AIES-D-23-0026.1</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib103"><label>Sweet et al.(2025)Sweet, Athanasiadis, van Bree, Castellano, Martre,
Paudel, Ruane, and Zscheischler</label><mixed-citation>
      
Sweet, L. B., Athanasiadis, I. N., van Bree, R., Castellano, A., Martre, P.,
Paudel, D., Ruane, A. C., and Zscheischler, J.: Transdisciplinary
coordination is essential for advancing agricultural modeling with machine
learning, One Earth, <a href="https://doi.org/10.1016/j.oneear.2025.101233" target="_blank">https://doi.org/10.1016/j.oneear.2025.101233</a>,
2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib104"><label>Tadesse et al.(2015)Tadesse, Senay, Berhan, Regassa, and
Beyene</label><mixed-citation>
      
Tadesse, T., Senay, G. B., Berhan, G., Regassa, T., and Beyene, S.: Evaluating
a satellite-based seasonal evapotranspiration product and identifying its
relationship with other satellite-derived products and crop yield: A case
study for Ethiopia, Int. J. Appl. Earth Obs., 40, 39–54, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib105"><label>Tanaka et al.(2023)Tanaka, Sun, Becker-Reshef, Song, and
Puricelli</label><mixed-citation>
      
Tanaka, T., Sun, L., Becker-Reshef, I., Song, X.-P., and Puricelli, E.:
Satellite forecasting of crop harvest can trigger a cross-hemispheric
production response and improve global food security, Commun. Earth
Environ., 4, 1–9, <a href="https://doi.org/10.1038/s43247-023-00992-2" target="_blank">https://doi.org/10.1038/s43247-023-00992-2</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib106"><label>Thomas and Uminsky(2022)</label><mixed-citation>
      
Thomas, R. L. and Uminsky, D.: Reliance on metrics is a fundamental challenge
for AI, Patterns, 3, 100476, <a href="https://doi.org/10.1016/j.patter.2022.100476" target="_blank">https://doi.org/10.1016/j.patter.2022.100476</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib107"><label>Tsaftaris and Scharr(2019)</label><mixed-citation>
      
Tsaftaris, S. A. and Scharr, H.: Sharing the Right Data Right: A
Symbiosis with Machine Learning, Trends  Plant Sci., 24, 99–102,
<a href="https://doi.org/10.1016/j.tplants.2018.10.016" target="_blank">https://doi.org/10.1016/j.tplants.2018.10.016</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib108"><label>Tseng et al.(2021a)Tseng, Kerner, Nakalembe, and
Becker-Reshef</label><mixed-citation>
      
Tseng, G., Kerner, H., Nakalembe, C., and Becker-Reshef, I.: Learning to
predict crop type from heterogeneous sparse labels using meta-learning, in:
2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops
(CVPRW), 1111–1120, <a href="https://doi.org/10.1109/CVPRW53098.2021.00122" target="_blank">https://doi.org/10.1109/CVPRW53098.2021.00122</a>,
2021a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib109"><label>Tseng et al.(2021b)Tseng, Zvonkov, Nakalembe, and
Kerner</label><mixed-citation>
      
Tseng, G., Zvonkov, I., Nakalembe, C., and Kerner, H.: CropHarvest: A global  dataset for crop-type classification, in: Proceedings of the Neural  Information Processing Systems Track on Datasets and Benchmarks, edited by:  Vanschoren, J. and Yeung, S., Vol. 1, Curran,
<a href="https://openreview.net/pdf?id=JtjzUXPEaCu" target="_blank">https://openreview.net/pdf?id=JtjzUXPEaCu</a> (last access: 30 May 2026),  2021b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib110"><label>Tseng et al.(2022)Tseng, Kerner, and Rolnick</label><mixed-citation>
      
Tseng, G., Kerner, H., and Rolnick, D.: TIML: Task-Informed
Meta-Learning for Agriculture, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2202.02124" target="_blank">https://doi.org/10.48550/arXiv.2202.02124</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib111"><label>Tzachor et al.(2022)Tzachor, Devare, King, Avin, and
Ó hÉigeartaigh</label><mixed-citation>
      
Tzachor, A., Devare, M., King, B., Avin, S., and Ó hÉigeartaigh, S.:
Responsible artificial intelligence in agriculture requires systemic
understanding of risks and externalities, Nature Machine Intelligence, 4,
104–109, <a href="https://doi.org/10.1038/s42256-022-00440-4" target="_blank">https://doi.org/10.1038/s42256-022-00440-4</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib112"><label>van der Velde and Nisini(2019)</label><mixed-citation>
      
van der Velde, M. and Nisini, L.: Performance of the MARS-crop yield
forecasting system for the European Union: Assessing accuracy,
in-season, and year-to-year improvements from 1993 to 2015, Agr.
Syst., 168, 203–212, <a href="https://doi.org/10.1016/j.agsy.2018.06.009" target="_blank">https://doi.org/10.1016/j.agsy.2018.06.009</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib113"><label>Van Klompenburg et al.(2020)Van Klompenburg, Kassahun, and
Catal</label><mixed-citation>
      
Van Klompenburg, T., Kassahun, A., and Catal, C.: Crop yield prediction using
machine learning: A systematic literature review, Comput. Electron.
Agr., 177, 105709, <a href="https://doi.org/10.1016/j.compag.2020.105709" target="_blank">https://doi.org/10.1016/j.compag.2020.105709</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib114"><label>Van Tricht et al.(2023)Van Tricht, Degerickx, Gilliams, Zanaga,
Battude, Grosu, Brombacher, Lesiv, Bayas, Karanam
et al.</label><mixed-citation>
      
Van Tricht, K., Degerickx, J., Gilliams, S., Zanaga, D., Battude, M., Grosu, A., Brombacher, J., Lesiv, M., Bayas, J. C. L., Karanam, S., Fritz, S., Becker-Reshef, I., Franch, B., Mollà-Bononad, B., Boogaard, H., Pratihast, A. K., Koetz, B., and Szantoi, Z.: WorldCereal: a dynamic open-source system for global-scale, seasonal, and reproducible crop and irrigation mapping, Earth Syst. Sci. Data, 15, 5491–5515, <a href="https://doi.org/10.5194/essd-15-5491-2023" target="_blank">https://doi.org/10.5194/essd-15-5491-2023</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib115"><label>Vermote(2015)</label><mixed-citation>
      
Vermote, E.: MOD09CMG MODIS/Terra Surface Reflectance Daily L3 Global 0.05Deg  CMG V006, NASA Land Processes Distributed Active Archive Center [data set], <a href="https://doi.org/10.5067/MODIS/MOD09CMG.006" target="_blank">https://doi.org/10.5067/MODIS/MOD09CMG.006</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib116"><label>Vijverberg et al.(2023)Vijverberg, Hamed, and
Coumou</label><mixed-citation>
      
Vijverberg, S., Hamed, R., and Coumou, D.: Skillful U.S. Soy Yield
Forecasts at Presowing Lead Times, Artificial Intelligence for the
Earth Systems, 2, <a href="https://doi.org/10.1175/AIES-D-21-0009.1" target="_blank">https://doi.org/10.1175/AIES-D-21-0009.1</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib117"><label>Waha et al.(2012)Waha, Van Bussel, Müller, and
Bondeau</label><mixed-citation>
      
Waha, K., Van Bussel, L., Müller, C., and Bondeau, A.: Climate-driven
simulation of global crop sowing dates, Global Ecol. Biogeogr., 21,
247–259, <a href="https://doi.org/10.1111/j.1466-8238.2011.00678.x" target="_blank">https://doi.org/10.1111/j.1466-8238.2011.00678.x</a>, 2012.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib118"><label>Wallach et al.(2021)Wallach, Palosuo, Thorburn, Hochman, Gourdain,
Andrianasolo, Asseng, Basso, Buis, Crout, Dibari, Dumont, Ferrise, Gaiser,
Garcia, Gayler, Ghahramani, Hiremath, Hoek, Horan, Hoogenboom, Huang,
Jabloun, Jansson, Jing, Justes, Kersebaum, Klosterhalfen, Launay, Lewan, Luo,
Maestrini, Mielenz, Moriondo, Nariman Zadeh, Padovan, Olesen, Poyda,
Priesack, Pullens, Qian, Schütze, Shelia, Souissi, Specka, Srivastava,
Stella, Streck, Trombi, Wallor, Wang, Weber, Weihermüller, de Wit,
Wöhling, Xiao, Zhao, Zhu, and Seidel</label><mixed-citation>
      
Wallach, D., Palosuo, T., Thorburn, P., Hochman, Z., Gourdain, E.,
Andrianasolo, F., Asseng, S., Basso, B., Buis, S., Crout, N., Dibari, C.,
Dumont, B., Ferrise, R., Gaiser, T., Garcia, C., Gayler, S., Ghahramani, A.,
Hiremath, S., Hoek, S., Horan, H., Hoogenboom, G., Huang, M., Jabloun, M.,
Jansson, P.-E., Jing, Q., Justes, E., Kersebaum, K. C., Klosterhalfen, A.,
Launay, M., Lewan, E., Luo, Q., Maestrini, B., Mielenz, H., Moriondo, M.,
Nariman Zadeh, H., Padovan, G., Olesen, J. E., Poyda, A., Priesack, E.,
Pullens, J. W. M., Qian, B., Schütze, N., Shelia, V., Souissi, A., Specka,
X., Srivastava, A. K., Stella, T., Streck, T., Trombi, G., Wallor, E., Wang,
J., Weber, T. K., Weihermüller, L., de Wit, A., Wöhling, T., Xiao, L.,
Zhao, C., Zhu, Y., and Seidel, S. J.: The chaos in calibrating crop models:
Lessons learned from a multi-model calibration exercise, Environ.
Model. Softw., 145, 105206,
<a href="https://doi.org/10.1016/j.envsoft.2021.105206" target="_blank">https://doi.org/10.1016/j.envsoft.2021.105206</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib119"><label>Wang et al.(2022)Wang, Albrecht, Braham, Mou, and
Zhu</label><mixed-citation>
      
Wang, Y., Albrecht, C. M., Braham, N. A. A., Mou, L., and Zhu, X. X.:
Self-supervised learning in remote sensing: A review, IEEE Geosci.
Remote S., 10, 213–247, 2022.


    </mixed-citation></ref-html>
<ref-html id="bib1.bib120"><label>Watson(2022)</label><mixed-citation>
      
Watson, P. A. G.: Machine learning applications for weather and climate need
greater focus on extremes, Environ. Res. Lett., 17, 111004,
<a href="https://doi.org/10.1088/1748-9326/ac9d4e" target="_blank">https://doi.org/10.1088/1748-9326/ac9d4e</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib121"><label>Xu et al.(2024)Xu, Ma, and Zhang</label><mixed-citation>
      
Xu, Y., Ma, Y., and Zhang, Z.: Self-supervised pre-training for large-scale
crop mapping using Sentinel-2 time series, ISPRS J. Photogramm., 207, 312–325, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib122"><label>Yeh et al.(2021)</label><mixed-citation>
      
Yeh, C., Meng, C., Wang, S., Driscoll, A., Rozi, E., Liu, P., Lee, J., Burke, M., Lobell, D., and Ermon, S.: SustainBench: Benchmarks for Monitoring the Sustainable Development Goals with Machine Learning, in: Thirty-fifth Conference on Neural Information Processing Systems, Datasets and Benchmarks Track (Round 2), Curran Associates, Inc., <a href="https://openreview.net/forum?id=5HR3vCylqD" target="_blank">https://openreview.net/forum?id=5HR3vCylqD</a> (last access: 30 May 2026), 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib123"><label>You et al.(2017)You, Li, Low, Lobell, and Ermon</label><mixed-citation>
      
You, J., Li, X., Low, M., Lobell, D., and Ermon, S.: Deep Gaussian Process for Crop Yield Prediction Based on Remote Sensing Data, in: Proceedings of the AAAI Conference on Artificial Intelligence, Association for the Advancement of Artificial Intelligence (AAAI), Vol. 31, <a href="https://doi.org/10.1609/aaai.v31i1.11172" target="_blank">https://doi.org/10.1609/aaai.v31i1.11172</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib124"><label>Zelingher and Makowski(2023)</label><mixed-citation>
      
Zelingher, R. and Makowski, D.: Investigating and forecasting the impact of
crop production shocks on global commodity prices, Environ. Res.
Lett., 19, 014026, <a href="https://doi.org/10.1088/1748-9326/ad0dda" target="_blank">https://doi.org/10.1088/1748-9326/ad0dda</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib125"><label>Zhang et al.(2022)Zhang, van der Wiel, Wei, Screen, Yue, Zheng,
Selten, Bintanja, Anderson, Blackport, Glomsrød, Liu, Cui, and
Yang</label><mixed-citation>
      
Zhang, T., van der Wiel, K., Wei, T., Screen, J., Yue, X., Zheng, B., Selten,
F., Bintanja, R., Anderson, W., Blackport, R., Glomsrød, S., Liu, Y., Cui,
X., and Yang, X.: Increased wheat price spikes and larger economic inequality
with 2&thinsp;°C global warming, One Earth, 5, 907–916,
<a href="https://doi.org/10.1016/j.oneear.2022.07.004" target="_blank">https://doi.org/10.1016/j.oneear.2022.07.004</a>, 2022.

    </mixed-citation></ref-html>--></article>
