<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="research-article">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">GMD</journal-id><journal-title-group>
    <journal-title>Geoscientific Model Development</journal-title>
    <abbrev-journal-title abbrev-type="publisher">GMD</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Geosci. Model Dev.</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1991-9603</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/gmd-19-4703-2026</article-id><title-group><article-title>AIFS Single 1.1.0: an update to ECMWF's machine-learned weather forecast model AIFS</article-title><alt-title>AIFS Single 1.1.0: an update to ECMWF's machine-learned weather forecast model AIFS</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" equal-contrib="yes" corresp="yes" rid="aff1">
          <name><surname>Moldovan</surname><given-names>Gabriel</given-names></name>
          <email>gabriel.moldovan@ecmwf.int</email>
        <ext-link>https://orcid.org/0000-0002-7785-1255</ext-link></contrib>
        <contrib contrib-type="author" equal-contrib="yes" corresp="no" rid="aff1">
          <name><surname>Pinnington</surname><given-names>Ewan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" equal-contrib="yes" corresp="no" rid="aff2">
          <name><surname>Prieto Nemesio</surname><given-names>Ana</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Lang</surname><given-names>Simon</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-3952-586X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Ben Bouallègue</surname><given-names>Zied</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-2914-4203</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Dramsch</surname><given-names>Jesper</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Alexe</surname><given-names>Mihai</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Santa Cruz</surname><given-names>Mario</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Hahner</surname><given-names>Sara</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-6911-2663</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Cook</surname><given-names>Harrison</given-names></name>
          
        <ext-link>https://orcid.org/0009-0009-3207-4876</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Theissen</surname><given-names>Helen</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Clare</surname><given-names>Mariana</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-5010-0363</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>O'Brien</surname><given-names>Cathal</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Polster</surname><given-names>Jan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Magnusson</surname><given-names>Linus</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-4707-2231</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Mertes</surname><given-names>Gert</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Pinault</surname><given-names>Florian</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-3003-3888</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Raoult</surname><given-names>Baudouin</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>de Rosnay</surname><given-names>Patricia</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-7374-3820</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Forbes</surname><given-names>Richard</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-3596-8287</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Chantry</surname><given-names>Matthew</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-1132-0961</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>European Centre for Medium-Range Weather Forecasts, Shinfield Park, Reading, RG2 9AX, United Kingdom</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>European Centre for Medium-Range Weather Forecasts, Robert-Schuman-Platz 3, 53175 Bonn, Germany</institution>
        </aff><author-comment content-type="econtrib"><p>These authors contributed equally to this work.</p></author-comment>
      </contrib-group>
      <author-notes><corresp id="corr1">Gabriel Moldovan (gabriel.moldovan@ecmwf.int)</corresp></author-notes><pub-date><day>1</day><month>June</month><year>2026</year></pub-date>
      
      <volume>19</volume>
      <issue>10</issue>
      <fpage>4703</fpage><lpage>4724</lpage>
      <history>
        <date date-type="received"><day>24</day><month>September</month><year>2025</year></date>
           <date date-type="rev-request"><day>17</day><month>October</month><year>2025</year></date>
           <date date-type="rev-recd"><day>23</day><month>March</month><year>2026</year></date>
           <date date-type="accepted"><day>22</day><month>April</month><year>2026</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 Gabriel Moldovan et al.</copyright-statement>
        <copyright-year>2026</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026.html">This article is available from https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026.html</self-uri><self-uri xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026.pdf">The full text article is available as a PDF file from https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e272">We present version 1.1.0 of ECMWF's Artificial Intelligence Forecasting System (AIFS Single), operational since 25 February 2025. The revised system introduces a bounding-layer framework that enforces physical constraints, such as non-negativity and internal consistency within precipitation and cloud cover variables, alongside expanded training data, revised loss weighting, and an extended set of surface and atmospheric variables. Overall skill improves by 4 %–6 % in the upper air and near-surface variables without degradation of spatial variability. A controlled comparison shows that training data expansion is the dominant source of upper-air skill gains, highlighting the importance of frequent model updates. The bounding framework delivers the largest precipitation improvements, up to 12 % and an approximately 1 d advantage using a categorical measure of skill. We further show that enforcing precipitation non-negativity resolves a gradient ambiguity at the zero-precipitation boundary under MSE training, explaining the reduction in drizzle bias and the improvements in precipitation.</p>
  </abstract>
    </article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e284">Machine-learned weather forecast models have started to rival or outperform physics-based numerical weather prediction (NWP) models in recent years <xref ref-type="bibr" rid="bib1.bibx27 bib1.bibx17 bib1.bibx19 bib1.bibx7 bib1.bibx3 bib1.bibx20" id="paren.1"/>. For both training and forecasting, these machine-learned forecast models mostly depend on the Copernicus ERA5 reanalysis dataset produced by ECMWF <xref ref-type="bibr" rid="bib1.bibx13" id="paren.2"/> and operational analysis by ECMWF's physics-based integrated forecasting system (IFS).</p>
      <p id="d2e293">ECMWF has developed the Artificial Intelligence Forecasting System (AIFS) <xref ref-type="bibr" rid="bib1.bibx20" id="paren.3"/>, its own machine-learned forecast model. After a successful pre-operational test phase running four times daily since October 2023, with forecasts publicly available under ECMWF's open data policy, AIFS has now transitioned to operational status. The first operational version, AIFS 1.0.0, which replaced AIFS 0.2.1, was implemented on 25 February 2025. The current operational version, AIFS 1.1.0 described here, was released on 27 August 2025 to correct a precipitation forecast issue in the initial version. The model is trained with a mean-squared error (MSE) loss function and is referred to as AIFS Single, to distinguish it from the probabilistically trained version, the AIFS ENS <xref ref-type="bibr" rid="bib1.bibx21" id="paren.4"/>.</p>
      <p id="d2e302">Although such MSE-trained forecast models have been shown to smooth forecast fields at longer lead times to avoid the double-penalty of incorrectly positioned weather phenomena <xref ref-type="bibr" rid="bib1.bibx19 bib1.bibx2 bib1.bibx20 bib1.bibx4 bib1.bibx6" id="paren.5"/>, they still display physically robust characteristics <xref ref-type="bibr" rid="bib1.bibx11" id="paren.6"/> and are able to make useful predictions of extreme events <xref ref-type="bibr" rid="bib1.bibx2" id="paren.7"/>. The cheaper training costs associated with MSE-trained models (compared to probabilistically trained models) make them attractive for prototyping new features and model components.</p>
      <p id="d2e314">To date, most machine-learned weather forecast models only include a limited subset of forecast variables available from current NWP systems. Here, we include for the first time in the AIFS soil moisture, soil temperature and runoff, together with energy-sector variables such as cloud cover, 100 m winds and solar radiation. The choice of additional variables has been guided by utility to users and by considerations of future applications of the model, alongside pragmatic considerations of data availability and readiness. Surface solar radiation and 100 m wind speeds, which are important for the renewable energy sector, have been included. We added an initial characterization of the land surface with prognostic soil moisture and soil temperature, important for drought forecasting. We also include snowfall, improving the representation of distinct precipitation types in the model. Finally, we have added runoff as a diagnostic model output, pushing towards a hydrological component for the AIFS.</p>
      <p id="d2e318">Despite their ability to produce skilful forecasts, machine-learned forecast models are prone to producing outputs that violate known physical relationships and limits (e.g., negative precipitation or mass imbalances). In current applications, including the pre-operational version of AIFS, post-processing of forecasts is commonly applied to remove such physical inconsistencies. Instead, we propose an additional final layer of activation functions that bound certain variables within physically meaningful limits and enforce physical constraints between related quantities. This simplifies the learning task by constraining the model output space to physically plausible regimes. This bounding strategy also proves particularly beneficial for variables with non-Gaussian distributions, such as precipitation, where the model must effectively distinguish between rain and no-rain states. Enforcing precipitation non-negativity resolves a gradient ambiguity at the zero-precipitation boundary under MSE training, greatly reducing drizzle bias and improving forecast skill in the light-precipitation regime.</p>
      <p id="d2e321">In this paper we begin by outlining the training setup of the model and how this differs from the previous AIFS version. Then we motivate and describe the new bounding strategy to make the model forecast more physically consistent. We demonstrate the improved performance of the revised AIFS version via evaluation results and selected case studies. We conclude by summarizing main results and future work in the discussion and conclusions.</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Training</title>
      <p id="d2e332">The architecture of AIFS follows an encoder-processor-decoder design. Here, encoder and decoder are attention-based graph neural networks, and the processor is a transformer with sliding-window attention (see <xref ref-type="bibr" rid="bib1.bibx20" id="altparen.8"/> for details).</p>
      <p id="d2e338">The model operates on a reduced Gaussian grid (N320, approximately 0.25° resolution). The processor (or hidden) grid is an O96 octahedral reduced Gaussian grid <xref ref-type="bibr" rid="bib1.bibx36" id="paren.9"/> with 40 320 grid points (approximately 1° resolution), and the processor consists of 16 layers.</p>
      <p id="d2e344">AIFS is trained to produce 6 h forecasts <inline-formula><mml:math id="M1" display="inline"><mml:mrow><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> using past and present atmospheric states at <inline-formula><mml:math id="M2" display="inline"><mml:mrow><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">6</mml:mn><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M3" display="inline"><mml:mrow><mml:msub><mml:mi>t</mml:mi><mml:mn mathvariant="normal">0</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (from ERA5 or ECMWF's operational analyses at initialization, or from the model forecast itself). Longer lead times are produced auto-regressively by feeding the model's predictions back as inputs, a process commonly referred to as rollout.</p>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Training schedule</title>
      <p id="d2e400">The training is divided into two phases. The first is a pre-training phase, where the model learns to predict the atmospheric state 6 h ahead (<inline-formula><mml:math id="M4" display="inline"><mml:mrow><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>) using ERA5 analysis at <inline-formula><mml:math id="M5" display="inline"><mml:mrow><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">6</mml:mn><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M6" display="inline"><mml:mrow><mml:msub><mml:mi>t</mml:mi><mml:mn mathvariant="normal">0</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. The second phase, rollout fine-tuning, continues from the pre-trained weights and trains the model to forecast auto-regressively up to 72 h. Here, the model learns to forecast from its own predictions. Unlike the previous AIFS version, where rollout fine-tuning was first performed using ERA5 and then followed by final fine-tuning on ECMWF operational analysis, we directly use operational analysis for the entire fine-tuning stage. This simplifies the training pipeline, reduces computational costs and is associated with improved forecast performance.</p>
      <p id="d2e447">Pre-training is performed on ERA5 data covering the years 1979–2022 (compared to 1979–2020 in the previous AIFS version), using a cosine learning rate (LR) schedule, a batch size of 16, and a total of 260 000 training steps. The LR is linearly increased from 0 to <inline-formula><mml:math id="M7" display="inline"><mml:mrow><mml:mn mathvariant="normal">5</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">4</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> during the first 1000 steps, then annealed to a minimum of <inline-formula><mml:math id="M8" display="inline"><mml:mrow><mml:mn mathvariant="normal">3</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. This is followed by rollout fine-tuning on ECMWF operational analysis from 2016 to 2022, also using a cosine LR schedule and batch size of 16, for approximately 7900 steps (equivalent to one epoch per rollout step). The LR starts at <inline-formula><mml:math id="M9" display="inline"><mml:mrow><mml:mn mathvariant="normal">1.28</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> and is annealed to the same minimum value of <inline-formula><mml:math id="M10" display="inline"><mml:mrow><mml:mn mathvariant="normal">3</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. 
The rollout length is initially set to 6 h (1 step) and progressively increased by one step per epoch up to 72 h (12 steps), following the approach of <xref ref-type="bibr" rid="bib1.bibx19" id="text.10"/> and <xref ref-type="bibr" rid="bib1.bibx20" id="text.11"/>. We used the AdamW optimizer <xref ref-type="bibr" rid="bib1.bibx22" id="paren.12"/> with <inline-formula><mml:math id="M11" display="inline"><mml:mi mathvariant="italic">β</mml:mi></mml:math></inline-formula> coefficients of 0.9 and 0.95. Here, the rollout dataset is extended to seven years of operational IFS analysis (2016–2022), compared with only two years (2019–2020) in the previous AIFS version.</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e542">Variables used in the training of AIFS, with their short names, level type, variable type, normalization method, and scaling factors. Variables marked with <sup>*</sup> were newly introduced compared to AIFS v0.2.1.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="6">
     <oasis:colspec colnum="1" colname="col1" align="justify" colwidth="3cm"/>
     <oasis:colspec colnum="2" colname="col2" align="justify" colwidth="1cm"/>
     <oasis:colspec colnum="3" colname="col3" align="justify" colwidth="2cm"/>
     <oasis:colspec colnum="4" colname="col4" align="justify" colwidth="2cm"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Variable name</oasis:entry>
         <oasis:entry colname="col2" align="left">Short name</oasis:entry>
         <oasis:entry colname="col3" align="left">Level type: pressure level (Pl, 50–1000 hPa) or surface (S)</oasis:entry>
         <oasis:entry colname="col4" align="left">Variable type: prognostic, diagnostic, forcing</oasis:entry>
         <oasis:entry colname="col5">Normalization</oasis:entry>
         <oasis:entry colname="col6">Scaling</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Geopotential</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M13" display="inline"><mml:mi>z</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">Pl</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M14" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">12</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Horizontal wind components</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M15" display="inline"><mml:mi>u</mml:mi></mml:math></inline-formula>, <inline-formula><mml:math id="M16" display="inline"><mml:mi>v</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">Pl</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M17" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">0.8, 0.5</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Specific humidity</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M18" display="inline"><mml:mi>q</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">Pl</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5">Std</oasis:entry>
         <oasis:entry colname="col6">0.6</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Temperature</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M19" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">Pl</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M20" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">6</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Surface pressure</oasis:entry>
         <oasis:entry colname="col2" align="left">sp</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M21" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">10</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Mean sea-level pressure</oasis:entry>
         <oasis:entry colname="col2" align="left">msl</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M22" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Skin temperature</oasis:entry>
         <oasis:entry colname="col2" align="left">skt</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M23" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">2 m temperature</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M24" display="inline"><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>t</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M25" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">2 m dewpoint temperature</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M26" display="inline"><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>d</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M27" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">0.5</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">10 m horizontal wind components</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M28" display="inline"><mml:mrow><mml:mn mathvariant="normal">10</mml:mn><mml:mi>u</mml:mi></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M29" display="inline"><mml:mrow><mml:mn mathvariant="normal">10</mml:mn><mml:mi>v</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">0.5, 0.5</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Total column water</oasis:entry>
         <oasis:entry colname="col2" align="left">tcw</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5">Std</oasis:entry>
         <oasis:entry colname="col6">1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Volumetric soil water level 1 and 2<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">swvl1, swvl2</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6">1, 2</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Soil temperature level 1 and 2<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">stl1, stl2</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">P</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6">1, 10</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Total precipitation</oasis:entry>
         <oasis:entry colname="col2" align="left">tp</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">Std</oasis:entry>
         <oasis:entry colname="col6">0.025</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Convective precipitation</oasis:entry>
         <oasis:entry colname="col2" align="left">cp</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">Std (tp)</oasis:entry>
         <oasis:entry colname="col6">0.0025</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Snowfall<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">sf</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">Std (tp)</oasis:entry>
         <oasis:entry colname="col6">0.025</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Total cloud cover<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">tcc</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6">0.1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">High cloud cover<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">hcc</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6">0.1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Medium cloud cover<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">mcc</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6">0.1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Low cloud cover<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">lcc</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6">0.1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Runoff<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">ro</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">Std</oasis:entry>
         <oasis:entry colname="col6">0.005</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Surface solar radiation downwards<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">ssrd</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5">Std</oasis:entry>
         <oasis:entry colname="col6">0.05</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Surface thermal radiation downwards<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left">strd</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M40" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">0.1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">100 m horizontal wind components<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M42" display="inline"><mml:mrow><mml:mn mathvariant="normal">100</mml:mn><mml:mi>u</mml:mi></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M43" display="inline"><mml:mrow><mml:mn mathvariant="normal">100</mml:mn><mml:mi>v</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">D</oasis:entry>
         <oasis:entry colname="col5"><inline-formula><mml:math id="M44" display="inline"><mml:mi>Z</mml:mi></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col6">0.1, 0.1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Land-sea mask</oasis:entry>
         <oasis:entry colname="col2" align="left">lsm</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Orography</oasis:entry>
         <oasis:entry colname="col2" align="left"><inline-formula><mml:math id="M45" display="inline"><mml:mi>z</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">Max</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Standard deviation of sub-grid orography</oasis:entry>
         <oasis:entry colname="col2" align="left">sdor</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">Max</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Slope of sub-scale orography</oasis:entry>
         <oasis:entry colname="col2" align="left">slor</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">Max</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Insolation</oasis:entry>
         <oasis:entry colname="col2" align="left">insolation</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1" align="left">Latitude/longitude (<inline-formula><mml:math id="M46" display="inline"><mml:mrow><mml:mi>cos⁡</mml:mi><mml:mo>/</mml:mo><mml:mi>sin⁡</mml:mi></mml:mrow></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col2" align="left">lat/lon</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1" align="left">Time of day/day of year</oasis:entry>
         <oasis:entry colname="col2" align="left">local time, julian day</oasis:entry>
         <oasis:entry colname="col3" align="left">S</oasis:entry>
         <oasis:entry colname="col4" align="left">F</oasis:entry>
         <oasis:entry colname="col5">None</oasis:entry>
         <oasis:entry colname="col6"/>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <fig id="F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e1527">A selection of new variables available from the revised AIFS Single forecasts: cloud cover (left panel), surface solar radiation (centre panel), and 100 m wind speed/direction (right panel). The consistency between these new variables is clear, with areas of higher cloud cover corresponding to lower solar radiation at the surface and consistent weather patterns for 100 m winds.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f01.png"/>

        </fig>

</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>Variables used in training</title>
      <p id="d2e1545">The variables used in the new AIFS version are listed in Table <xref ref-type="table" rid="T1"/>. As in AIFS 0.2.1, the upper atmosphere is represented by geopotential, horizontal wind components, specific humidity, and temperature at 13 pressure levels: 50, 100, 150, 200, 250, 300, 400, 500, 600, 700, 850, 925, and 1000 hPa. Newly introduced variables are marked with <sup>*</sup>. We have increased the characterization of the land surface in the model by including new prognostic variables of soil moisture at levels 1 and 2 (swvl1 and swvl2), and soil temperature at levels 1 and 2 (stl1 and stl2), important for drought monitoring and forecasting. A notion of hydrology has been included with runoff (ro), forecast as a diagnostic variable. A second set of variables, related to energy forecasting and clouds, adds real value to the model's utility. These are forecast diagnostically and include the 100 m wind components (<inline-formula><mml:math id="M48" display="inline"><mml:mrow><mml:mn mathvariant="normal">100</mml:mn><mml:mi>u</mml:mi></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M49" display="inline"><mml:mrow><mml:mn mathvariant="normal">100</mml:mn><mml:mi>v</mml:mi></mml:mrow></mml:math></inline-formula>), surface solar and thermal radiation (ssrd and strd), and cloud cover at various levels (tcc, hcc, mcc, lcc). Finally, snowfall (sf) has been added to complement the set of total precipitation-related variables. An illustration of a selection of these variables can be seen in the forecast presented in Fig. <xref ref-type="fig" rid="F1"/>, where the consistency between these new variables is clear, with areas of higher cloud cover corresponding to lower solar radiation at the surface and consistent weather patterns for 100-metre winds. These new variables are sourced from the ERA5 reanalysis and IFS operational data archive, in line with those used in the previous AIFS version (0.2.1).</p>
      <p id="d2e1581">The per-variable normalization strategy used in AIFS is summarized in Table <xref ref-type="table" rid="T1"/>. Unless stated otherwise, data is normalized to zero mean and unit variance (z-score normalization). For some bounded output variables (see Sect. <xref ref-type="sec" rid="Ch1.S3"/>), only standard deviation normalization is applied to avoid shifting of the absolute zero in the normalized space. The loss function is unchanged from the previous AIFS version. Table <xref ref-type="table" rid="T1"/> shows the loss scaling factors we use in the revised AIFS version. Scaling factors were chosen empirically to ensure that all prognostic variables contribute approximately equally to the loss function, with the exception of vertical velocities and soil moisture, which are deliberately down-weighted. Vertical velocity is down-weighted due to known accuracy limitations in ERA5, particularly in convective regions. Soil moisture receives reduced weight for similar reasons, and additionally because the transition from ERA5-based pretraining to operational IFS analysis during fine-tuning introduces distributional inconsistencies; down-weighting mitigates the influence of this mismatch on training. Furthermore, the loss weights decrease linearly with height, so that upper atmospheric levels contribute less to the total loss. The pressure level weights are calculated following <inline-formula><mml:math id="M50" display="inline"><mml:mrow><mml:mi>w</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="normal">max</mml:mi><mml:mo>(</mml:mo><mml:mi mathvariant="normal">pressure</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi mathvariant="normal">level</mml:mi><mml:mo>/</mml:mo><mml:mn mathvariant="normal">1000</mml:mn><mml:mo>,</mml:mo><mml:mn mathvariant="normal">0.2</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, as in AIFS-ENS <xref ref-type="bibr" rid="bib1.bibx21" id="paren.13"/>. 
A minimum weight of 0.2 is imposed in the revised version to avoid assigning excessively low values in the stratosphere.</p>
      <p id="d2e1616">AIFS is trained using data parallelism with a batch size of 16, while each model instance is distributed across four GPUs within a single node <xref ref-type="bibr" rid="bib1.bibx20" id="paren.14"/>. Training was conducted on the European supercomputer Leonardo (EuroHPC), hosted and managed by Cineca, on 64 GB A100 GPUs. Mixed-precision training is used <xref ref-type="bibr" rid="bib1.bibx23" id="paren.15"/>, and the full process takes approximately 3 d. A 10 d forecast can be produced in about 2 min and 30 s on a single A100 40 GB GPU, including data input and output.</p>

      <fig id="F2" specific-use="star"><label>Figure 2</label><caption><p id="d2e1628">Comparison of 24 h total precipitation accumulation from five forecasting systems for the forecast issued at 1 June 2023 00:00 UTC and valid at 2 June 2023 00:00 UTC: previous AIFS, revised AIFS, operational IFS, GraphCast, and FuXi. The previous AIFS, GraphCast, and FuXi all exhibit excess light rainfall, a characteristic bias of ML weather models. The revised AIFS, incorporating the bounding layer framework, largely corrects the excess light precipitation issue and provides a precipitation distribution closer to the IFS reference in the light precipitation range.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f02.png"/>

        </fig>

</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Enforcing model constraints</title>
      <p id="d2e1646">Machine-learned forecast models for numerical weather prediction show very good forecast skill, yet they are prone to producing outputs that violate known physical laws or expected statistical consistency. Unlike traditional numerical models, which are governed by equations ensuring mass conservation, positivity, or energy bounds, machine-learned forecast models lack such guarantees by default. As a result, physically implausible outputs, such as negative precipitation, can emerge. We show that incorporating constraints into the model design to enforce physical realism improves forecast skill. In this section, we first identify specific issues in the output of the previous AIFS version related to total precipitation, and then introduce a simple yet effective method to bound the model outputs using activation functions. The proposed method is not restricted to total precipitation but can be equally applied to other variables.</p>
<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Lack of physical realism in precipitation forecasts</title>
      <p id="d2e1656">The previous AIFS version suffers from significant drawbacks in forecasting precipitation. Most notably, the model's output is not constrained, leading to a frequent occurrence of negative values. This is illustrated in Fig. <xref ref-type="fig" rid="F2"/>, which compares the 24 h accumulated total precipitation forecasts from the previous AIFS version, the revised version, GraphCast <xref ref-type="bibr" rid="bib1.bibx19" id="paren.16"/>, FuXi <xref ref-type="bibr" rid="bib1.bibx7" id="paren.17"/> and an IFS (47r3) 24 h forecast, for the run initialized on 1 June 2023 at 00:00 UTC and valid at 2 June 2023 00:00 UTC. The previous AIFS model and GraphCast show spurious negative precipitation values, which are largely corrected in the revised AIFS. While negative values can be clipped to zero at inference time (as is done in FuXi in this figure and thus not visible), their presence highlights a lack of physical consistency in the model.</p>
      <p id="d2e1667">In addition to the negative values, a second noticeable issue, also visible in Fig. <xref ref-type="fig" rid="F2"/> and present for all the models but the AIFS revised version, is the excess of light precipitation in the forecast. The models produce excessive light rain leading to a bias in the forecast. Similar behaviour has been reported in benchmark studies such as WeatherBench 2 <xref ref-type="bibr" rid="bib1.bibx29" id="paren.18"/>, where AI-based systems including GraphCast, Pangu-Weather, and FuXi produce overly smooth precipitation fields and inflated frequencies of weak events, despite substantial architectural differences.</p>
      <p id="d2e1675">This is further supported by verification metrics computed against in situ observations (SYNOP stations). The Frequency Bias Index (FBI) scores for 2023 over Europe (Fig. <xref ref-type="fig" rid="F3"/>) confirm that the pre-operational AIFS systematically over-forecasts light precipitation events (<inline-formula><mml:math id="M51" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> mm). While a similar tendency is present in the IFS, it is considerably more pronounced in the machine-learned forecast model. At the other end of the distribution, the model tends to under-forecast more intense precipitation, as indicated by FBI values well below unity for thresholds exceeding 10 mm. This may be attributed to a well-known characteristic of machine learning-based forecasts: a tendency to produce overly smooth spatial fields, which can suppress extremes <xref ref-type="bibr" rid="bib1.bibx2 bib1.bibx4" id="paren.19"/>. Additionally, the coarser native resolution of AIFS (N320 0.25° grid) compared to IFS (0.1° grid) reduces its spatial representativeness.</p>

      <fig id="F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e1696">Frequency Bias Index (FBI, top panels) and Peirce Skill Score (PSS, bottom panels) for 24 h accumulated precipitation over Europe as a function of threshold, at forecast day 1, 3, and 6 (left to right panels). Scores are averaged over all initialisation dates in 2023. Filled markers indicate that the difference relative to the previous AIFS version is statistically significant (paired Wilcoxon signed-rank test, <inline-formula><mml:math id="M52" display="inline"><mml:mrow><mml:mi>p</mml:mi><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0.05</mml:mn></mml:mrow></mml:math></inline-formula>); open markers indicate non-significant differences. The previous AIFS version exhibits a pronounced positive frequency bias at low thresholds, consistent with systematic overforecasting of light precipitation.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f03.png"/>

        </fig>

      <fig id="F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e1719">Comparison of 24 h total and convective precipitation forecast from the previous AIFS version, together with a map showing the difference between the two of them for the forecast issued at 1 June 2023 00:00 UTC and valid at 2 June 2023 00:00 UTC. Positive values (coloured regions) in the difference plot indicate areas where convective precipitation is greater than the total precipitation.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f04.png"/>

        </fig>

      <p id="d2e1728">Convective precipitation forecasts also exhibit similar shortcomings. In addition, there is a further lack of physical consistency. Convective precipitation represents the part of the total precipitation that originates from convection, and therefore should always be less than or equal to the total. Figure <xref ref-type="fig" rid="F4"/> shows the previous AIFS 24 h accumulated forecasts of total and convective precipitation for 2 June 2023. The map displaying the difference between the two reveals frequent cases in which convective precipitation exceeds total precipitation, which should not occur.</p>
      <p id="d2e1733">The CREDIT platform <xref ref-type="bibr" rid="bib1.bibx31" id="paren.20"/> has recently been used to explore physically informed constraints for addressing drizzle bias: <xref ref-type="bibr" rid="bib1.bibx33" id="text.21"/> implemented global mass and energy conservation schemes as modular constraints within FuXi and demonstrated a direct reduction of drizzle bias; a companion study <xref ref-type="bibr" rid="bib1.bibx32" id="paren.22"/> further showed that incorporating terrain-following (hybrid sigma-pressure) coordinates can improve extreme precipitation forecasts.</p>
      <p id="d2e1745">Here, we address the drizzle and negative precipitation issues through a simplified intervention: enforcing only the physically admissible output range via a hard constraint. This approach is described in Sect. <xref ref-type="sec" rid="Ch1.S3.SS2"/>. In Sect. <xref ref-type="sec" rid="Ch1.S4.SS1"/>, we show that this minimal architectural modification fundamentally reshapes the loss landscape in the vicinity of zero precipitation, eliminating gradient ambiguity and substantially reducing light-precipitation bias.</p>
</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Bounding the outputs with activation functions</title>
      <p id="d2e1760">Precipitation has been used as an example to demonstrate the biases present in the forecasts of some variables. These issues are not limited to precipitation but are observed in all sparsely distributed variables. This behaviour can be avoided by constraining the output of the model.</p>
      <p id="d2e1763">There are different strategies one could adopt to enforce physical constraints in the ML model. More specifically, here we tackled unphysical outputs, and we did not consider other constraints such as energy or mass conservation. Introducing loss penalties for outputs that fall outside the known physical bounds can be an effective strategy, and it has the advantage of not requiring any specific model change. Alternatively, the model could be modified in such a way as to prevent output from exceeding variable-specific physical bounds. This is usually referred to as hard-constraining. There are some examples in the literature of hard-constrained machine-learned models for climate and weather, such as <xref ref-type="bibr" rid="bib1.bibx12" id="text.23"/>. The authors apply a softmax function, a generalization of the logistic function, as a hard constraint for predicting quantities like atmospheric water content, to enforce the output to be non-negative in climate downscaling. Other examples can be found in <xref ref-type="bibr" rid="bib1.bibx18" id="text.24"/>, <xref ref-type="bibr" rid="bib1.bibx5" id="text.25"/> or <xref ref-type="bibr" rid="bib1.bibx34" id="text.26"/>. Similarly, we argue that hard constraints on the output can be enforced using an activation function.</p>
      <p id="d2e1778">Activation functions can be used in a straightforward way to enforce bounds in the output of machine-learned forecast models. Arguably the most famous activation function, and the one we used in this work, is the Rectified Linear Unit (ReLU), a nonlinear function defined as:

            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M53" display="block"><mml:mrow><mml:mi mathvariant="normal">ReLU</mml:mi><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mi mathvariant="normal">max</mml:mi><mml:mo>(</mml:mo><mml:mn mathvariant="normal">0</mml:mn><mml:mo>,</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>

          ReLU maps all negative values to zero, effectively enforcing a hard lower bound on the output.</p>
      <p id="d2e1812">For variables requiring both upper and lower bounds, such as concentrations or fractions, the Hard Hyperbolic Tangent (HardTanh) function is an effective choice. It is a piecewise linear approximation of the hyperbolic tangent, defined as:

            <disp-formula id="Ch1.Ex1"><mml:math id="M54" display="block"><mml:mrow><mml:mi mathvariant="normal">HardTanh</mml:mi><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mfenced close="" open="{"><mml:mtable class="array" columnalign="center left"><mml:mtr><mml:mtd><mml:mn mathvariant="normal">0</mml:mn></mml:mtd><mml:mtd><mml:mrow><mml:mi mathvariant="normal">if</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi>x</mml:mi><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mi>x</mml:mi></mml:mtd><mml:mtd><mml:mrow><mml:mi mathvariant="normal">if</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mn mathvariant="normal">0</mml:mn><mml:mo>≤</mml:mo><mml:mi>x</mml:mi><mml:mo>≤</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mn mathvariant="normal">1</mml:mn></mml:mtd><mml:mtd><mml:mrow><mml:mi mathvariant="normal">if</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi>x</mml:mi><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mfenced><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>

          HardTanh can also be used to enforce consistency between related output variables. For instance, consider the case of convective precipitation (Fig. <xref ref-type="fig" rid="F4"/>), which is predicted independently of total precipitation in the previous AIFS version. There is a clear relation between the two quantities: convective precipitation is a fraction of total precipitation and should never exceed it. A more physically consistent approach is to map the original convective output to the [0, 1] range using a HardTanh layer and to multiply this output by the predicted total precipitation: 

            <disp-formula id="Ch1.E2" content-type="numbered"><label>2</label><mml:math id="M55" display="block"><mml:mrow><mml:mi mathvariant="normal">cp</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="normal">HardTanh</mml:mi><mml:mo>(</mml:mo><mml:msup><mml:mi mathvariant="normal">cp</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>)</mml:mo><mml:mo>×</mml:mo><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>

          where cp<sup>′</sup> is the convective precipitation output before the activation layer. This guarantees consistency. This type of constraint, referred to as FractionBounding, is applied to variables related to total precipitation and total cloud cover.</p>
      <p id="d2e1926">Clipping the precipitation output at inference time is a possibility and a common practice. This was the case in the pre-operational AIFS model and is also reported in other studies, such as <xref ref-type="bibr" rid="bib1.bibx1" id="text.27"/>. However, we show that the introduction of bounding in the output during training has benefits beyond simply avoiding slightly negative or unphysical values: it can facilitate the learning of forecasting for sparse and intermittent variables. Bounding effectively decomposes the prediction space into two distinct regions. In the case of total precipitation, the negative space becomes a proxy for forecasting the non-event, while the positive space corresponds to the occurrence of precipitation. This decomposition may, in principle, help the model more easily perform a classification between event and non-event outcomes, a distinction the previous AIFS version struggles with.</p>
      <p id="d2e1932">Table <xref ref-type="table" rid="T2"/> summarises the bounding strategy used in the new version of the AIFS. Since bounding is performed on the normalized space, the choice of the normalization strategy is essential. In particular, variables bounded using a ReLU function were normalized using the standard deviation only, as indicated in Table <xref ref-type="table" rid="T1"/>, to avoid offsetting the zero value. Since snowfall and convective precipitation are predicted as fractions of total precipitation, it is necessary to ensure consistent magnitudes in the normalized space. Therefore, cp and sf were scaled using the standard deviation of total precipitation rather than their own. Total cloud cover and soil moisture variables (swvl1 and swvl2) were not normalized, since their range falls within the constraints imposed by the HardTanh bounding ([0, 1]).</p>

<table-wrap id="T2" specific-use="star"><label>Table 2</label><caption><p id="d2e1942">Summary of bounding strategies used in the new version of AIFS. </p></caption><oasis:table frame="topbot"><oasis:tgroup cols="3">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Bounding type</oasis:entry>
         <oasis:entry colname="col2">Range</oasis:entry>
         <oasis:entry colname="col3">Variables</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">ReluBounding</oasis:entry>
         <oasis:entry colname="col2">[0, <inline-formula><mml:math id="M57" display="inline"><mml:mi mathvariant="normal">∞</mml:mi></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col3">tp, ro, tcw, ssrd, <inline-formula><mml:math id="M58" display="inline"><mml:mi>q</mml:mi></mml:math></inline-formula>(50–1000 hPa)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">HardtanhBounding</oasis:entry>
         <oasis:entry colname="col2">[0, 1]</oasis:entry>
         <oasis:entry colname="col3">tcc, swvl1, swvl2</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">FractionBounding (w.r.t. tp)</oasis:entry>
         <oasis:entry colname="col2">[0, 1]</oasis:entry>
         <oasis:entry colname="col3">cp, sf</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">FractionBounding (w.r.t. tcc)</oasis:entry>
         <oasis:entry colname="col2">[0, 1]</oasis:entry>
         <oasis:entry colname="col3">lcc, mcc, hcc</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Evaluation</title>
      <p id="d2e2045">Unless otherwise stated, all verification results presented in this section are based on twice-daily forecasts initialised at 00:00 and 12:00 UTC for every day of 2023, verified against operational IFS analyses.</p>

      <fig id="F5" specific-use="star"><label>Figure 5</label><caption><p id="d2e2050">Anomaly correlation skill score difference for Geopotential at 500 hPa and Temperature at 850 hPa for 2023. This controlled comparison shows: (1) AIFS revised model (full system with all modifications), (2) AIFS revised trained with limited data (ERA5 up to 2020, rollout fine-tuning 2019–2020 only), and (3) AIFS previous version. The close agreement between configurations (2) and (3) demonstrates that the substantial performance gain is primarily attributable to the expanded training dataset (ERA5 1979–2022 and rollout data 2016–2022). Solid points indicate statistically significant differences relative to AIFS revised used as reference (paired Wilcoxon signed-rank test, <inline-formula><mml:math id="M59" display="inline"><mml:mrow><mml:mi>p</mml:mi><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0.05</mml:mn></mml:mrow></mml:math></inline-formula>).</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f05.png"/>

      </fig>

      <p id="d2e2071">The revised AIFS version delivers highly skilled forecasts, as shown by anomaly correlation scores for 2023 in the Northern Hemisphere (Fig. <xref ref-type="fig" rid="F8"/>). In the medium range (3–10 d), AIFS outperforms the IFS by 12 to 24 h in skill. Forecast skill is also clearly improved compared to the previous AIFS version. This performance gain can be attributed to the combined effect of increased training data, improvements in rollout fine-tuning, the implementation of output bounding, and the inclusion of new prognostic variables. To quantify the specific contribution of expanded training data, we present a controlled comparison in Fig. <xref ref-type="fig" rid="F5"/>. We verify against the operational IFS analysis, which is also used to initialise the forecasts.</p>
      <p id="d2e2079">As shown in Fig. <xref ref-type="fig" rid="F5"/>, the expanded training dataset accounts for the largest portion of the overall performance gain. This indicates that data availability (ERA5 extended to 2022 and rollout fine-tuning expanded from 2019–2020 to 2016–2022) plays a major role. The remaining improvement stems from other system modifications, including rollout fine-tuning schedules, output bounding layers, and expanded prognostic variables. Due to the high computational cost, a detailed ablation study to isolate the impact of each individual modification beyond data expansion was not performed; thus, the observed improvements represent the cumulative result of these integrated system updates. It should be noted that the close agreement between AIFS revised (2020 data) and AIFS previous in ACC should be interpreted with caution, as these configurations differ in their training protocols: AIFS previous includes a rollout fine-tuning phase on ERA5 which AIFS revised (2020) does not, and uses only 2 years (2019–2020) of operational data for final rollout fine-tuning compared to 6 years (2016–2022) in the full revised version. Furthermore, similar ACC scores do not imply equivalent forecast quality. As shown in Fig. <xref ref-type="fig" rid="F6"/>, AIFS revised (2020) exhibits less mesoscale smoothing than AIFS previous despite comparable ACC, indicating that the changes introduced in the revised system do contribute positively to forecast quality in ways not fully captured by ACC alone.</p>

      <fig id="F6" specific-use="star"><label>Figure 6</label><caption><p id="d2e2088">Z500 power spectral density as a function of zonal wavenumber (bottom axis) and approximate horizontal scale in km (top axis) for forecast lead times Day 1, 3, 5, and 10 during JJA 2023. Spectra from the revised AIFS (blue), AIFS revised trained with limited data (ERA5 up to 2020, rollout fine-tuning 2019–2020 only) in dashed orange, and previous AIFS (orange) are compared against the IFS analysis (black). Insets highlight the 450–600 km scale range (zonal wavenumbers 70–90), corresponding to large mesoscale structures. The revised AIFS shows improved agreement with the IFS analysis at large mesoscale structures, particularly at longer lead times, indicating a better representation and retention of mesoscale variance.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f06.png"/>

      </fig>

      <p id="d2e2097">Additionally, imposing a minimum on the loss weights in the stratosphere leads to significant improvements in the data-driven forecasts at 100 and 50 hPa (Fig. <xref ref-type="fig" rid="F9"/>). For temperature at 100 hPa, the new version of the AIFS outperforms the IFS, while for 50 hPa wind speed, the gap in skill between the previous version of AIFS and the IFS in the stratosphere is significantly reduced.</p>
      <p id="d2e2102">Forecast skill for key surface variables, such as 2 m temperature and 10 m wind speed, verified against SYNOP observations, is similarly improved (Fig. <xref ref-type="fig" rid="F10"/>). Overall, the new AIFS version exhibits improvements of around 4 %–6 % across all variables, lead times, and pressure levels relative to the previous AIFS version, as shown in the scorecard presented in Fig. <xref ref-type="fig" rid="F7"/>. The performance of the model for tropical cyclone prediction is similar to that of the previous version (see <xref ref-type="bibr" rid="bib1.bibx20" id="altparen.28"/>), with some small improvements to track position. The training configuration, including a maximum rollout length of 12 (72 h), was retained from the previous AIFS version, as shown in Sect. <xref ref-type="sec" rid="Ch1.S2.SS1"/>. This parameter is known to influence spectral characteristics, with longer rollouts leading to enhanced damping. No explicit tuning was performed to target spectral behaviour.</p>

      <fig id="F7" specific-use="star"><label>Figure 7</label><caption><p id="d2e2116">Scorecard comparing forecast scores of AIFS revised versus the previous AIFS version for the whole year of 2023. Forecasts are initialised at 00:00 and 12:00 UTC. Relative score changes are shown as a function of lead time (day 1 to 10) for northern extra-tropics (n.hem), southern extra-tropics (s.hem) and tropics. Blue colours mark score improvements and red colours score degradations. Purple colours indicate an increase in the standard deviation of forecast anomaly, while green colours indicate a reduction. Framed rectangles indicate 95 % significance level. Numbers following variable abbreviations indicate variables on pressure levels (e.g., 500 hPa), and the suffix indicates verification against IFS NWP analyses (an) or radiosonde and SYNOP observations (ob). Scores shown are anomaly correlation (ccaf), SEEPS (seeps, for 24 h precipitation accumulation), RMSE (rmsef) and standard deviation of forecast anomaly (sdaf).</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f07.png"/>

      </fig>

      <fig id="F8" specific-use="star"><label>Figure 8</label><caption><p id="d2e2128">Anomaly correlation skill scores for geopotential and temperature at 500 and 850 hPa, respectively. Skill scores computed for the Northern Hemisphere for the whole of 2023 against IFS analysis. In the medium range, AIFS revised outperforms the IFS by 12 to 24 h in skill. Forecast skill is also clearly improved compared to the previous AIFS version.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f08.png"/>

      </fig>

      <fig id="F9" specific-use="star"><label>Figure 9</label><caption><p id="d2e2139">Anomaly correlation skill scores for temperature at 100 hPa and wind speed at 50 hPa. Skill scores are computed for the Northern Hemisphere for the whole of 2023 against IFS analysis. The revised AIFS forecasts show significant improvements at 100 and 50 hPa when compared against the previous AIFS version.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f09.png"/>

      </fig>

      <fig id="F10" specific-use="star"><label>Figure 10</label><caption><p id="d2e2150">RMSE scores for 2 m temperature and 10 m wind speed computed against SYNOP observations over the Northern Hemisphere. The revised AIFS version shows improvement when compared to the previous version of the AIFS.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f10.png"/>

      </fig>

      <p id="d2e2159">The resulting Z500 power spectral densities shown in Fig. <xref ref-type="fig" rid="F6"/> are very similar to those of the previous AIFS across scales, including the <inline-formula><mml:math id="M60" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">500</mml:mn></mml:mrow></mml:math></inline-formula> km range (zonal wavenumbers 70–90), with slightly improved agreement with the IFS analysis at longer lead times. At the same time, the RMSE-based scorecard (Fig. <xref ref-type="fig" rid="F7"/>) shows overall improvements. Taken together, these results indicate that the skill gains are not achieved at the expense of degraded spatial variability.</p>
      <p id="d2e2176">Figure <xref ref-type="fig" rid="F11"/> presents verification metrics for several variables introduced in the new version. In line with those already present in earlier versions, AIFS shows a gain in forecast skill of around 1 d in the medium range for surface short-wave downwards radiation verified against geostationary satellite observations via CMSAF <xref ref-type="bibr" rid="bib1.bibx28" id="paren.29"/> and 100 m wind speed verified against ECMWF operational analysis, relative to the IFS. The population distribution for total cloud cover verified against SYNOP observations, however, highlights the inherent limitations of MSE-trained AI models. While the observed distribution follows a U-shape, with high frequency at the tails of the distribution (clear skies and overcast conditions), AIFS produces a much flatter distribution, under-predicting these extremes and over-estimating intermediate values. This behaviour is closely linked to the smoothing effect introduced by the MSE loss function, which tends to penalize large deviations and thereby suppress extremes (see Sect. <xref ref-type="sec" rid="Ch1.S5"/>).</p>

      <fig id="F11" specific-use="star"><label>Figure 11</label><caption><p id="d2e2189">Forecast RMSE computed against operational IFS analysis and distribution comparison for new variables. <bold>(a)</bold> Surface solar radiation downwards RMSE for March–May (MAM) 2023, <bold>(b)</bold> 100 m wind speed RMSE for the full year 2023, <bold>(c)</bold> total cloud cover distribution for June–August (JJA) 2023. Blue lines show the AIFS revised and red lines show IFS; observations are shown in grey in panel <bold>(c)</bold>. AIFS shows significant gains in forecast skill in the medium range for surface short-wave downwards radiation and 100 m winds when compared against the IFS. The mismatch in population distribution for total cloud cover forecast highlights the inherent limitations of MSE-trained AI models.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f11.png"/>

      </fig>

      <fig id="F12" specific-use="star"><label>Figure 12</label><caption><p id="d2e2212">SEEPS skill scores for 2023 based on 24 h accumulated precipitation from SYNOP observations, comparing the revised AIFS (blue), the previous AIFS version (orange), and the IFS (red) across different regions. Results show a consistent and statistically significant improvement across all lead times and in the Northern Hemisphere and the Southern Hemisphere for the revised AIFS version when compared to the previous AIFS version and the IFS.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f12.png"/>

      </fig>

      <p id="d2e2221">The forecasting skill of the model with respect to 24 h accumulated total precipitation is significantly improved. The new AIFS version is compared against both the previous AIFS version and the operational IFS (cycles 47r3 and 48r1) in Fig. <xref ref-type="fig" rid="F12"/>. The Stable Equitable Error in Probability Space (SEEPS) skill score <xref ref-type="bibr" rid="bib1.bibx30" id="paren.30"/> is used as the primary verification metric, with 24 h accumulated precipitation SYNOP observations serving as the reference. Results show a consistent and statistically significant improvement across all lead times and in the Northern Hemisphere and the Southern Hemisphere. The revised AIFS demonstrates approximately a 1 d gain in forecast skill relative to both IFS and the previous AIFS version. The forecast fields also exhibit noticeable improvements, as illustrated in Fig. <xref ref-type="fig" rid="F2"/>. The new version of the AIFS produces no negative values in the output and substantially reduces light precipitation, aligning more closely with the 24 h total precipitation accumulation fields derived from the IFS operational short-range forecasts.</p>
      <p id="d2e2231">Figure <xref ref-type="fig" rid="F3"/> reveals where the improvement originates. The Frequency Bias Index (FBI, <xref ref-type="bibr" rid="bib1.bibx38" id="altparen.31"/>), defined as the ratio of predicted to observed event frequency at a given threshold (<inline-formula><mml:math id="M61" display="inline"><mml:mrow><mml:mi mathvariant="normal">FBI</mml:mi><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:mi>H</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">FA</mml:mi><mml:mo>)</mml:mo><mml:mo>/</mml:mo><mml:mo>(</mml:mo><mml:mi>H</mml:mi><mml:mo>+</mml:mo><mml:mi>M</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M62" display="inline"><mml:mi>H</mml:mi></mml:math></inline-formula> are hits, FA false alarms, and <inline-formula><mml:math id="M63" display="inline"><mml:mi>M</mml:mi></mml:math></inline-formula> misses), and the Peirce Skill Score (PSS, also known as the Hanssen–Kuipers discriminant; <xref ref-type="bibr" rid="bib1.bibx16" id="altparen.32"/>), defined as the difference between the probability of detection and the probability of false detection (<inline-formula><mml:math id="M64" display="inline"><mml:mrow><mml:mi mathvariant="normal">PSS</mml:mi><mml:mo>=</mml:mo><mml:mi>H</mml:mi><mml:mo>/</mml:mo><mml:mo>(</mml:mo><mml:mi>H</mml:mi><mml:mo>+</mml:mo><mml:mi>M</mml:mi><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:mi mathvariant="normal">FA</mml:mi><mml:mo>/</mml:mo><mml:mo>(</mml:mo><mml:mi mathvariant="normal">FA</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">CN</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, where CN are correct negatives), are shown for the Northern Hemisphere for different thresholds. 
The previous AIFS version exhibits a strong tendency to over-predict light precipitation events (<inline-formula><mml:math id="M65" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> mm) across all lead times, as shown by the FBI. This bias is substantially corrected due to the bounding (see Sect. <xref ref-type="sec" rid="Ch1.S4.SS1"/>) in the revised AIFS.</p>
      <p id="d2e2343">While the AI model still slightly over-predicts light precipitation compared to the IFS, it demonstrates competitive skill for light precipitation. The AIFS excels at medium-intensity events (1–10 mm), with PSS scores significantly higher than those of the IFS. At higher thresholds (<inline-formula><mml:math id="M66" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> mm), corresponding to moderate to heavy precipitation, the AIFS diverges from the IFS, with a marked under-prediction (FBI <inline-formula><mml:math id="M67" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 1). This is likely caused by smoothing introduced by the loss function, in combination with the model’s coarser spatial resolution.</p>
      <p id="d2e2364">This under-prediction plays an important role in the metrics concerning more extreme events, since both the previous and the revised AIFS models underperform the IFS for thresholds exceeding 10 mm in terms of PSS, but remain competitive. This suggests that although the AI models predict fewer high-intensity events, their predictions are more accurate when they do occur. Finally, the revised AIFS shows a marginal improvement in terms of PSS compared against the previous AIFS version, possibly due to improvements in the learning-rate scheduling used for fine-tuning and additional training data.</p>
<sec id="Ch1.S4.SS1">
  <label>4.1</label><title>Evaluating the effects of bounding on total precipitation</title>
      <p id="d2e2374">Overall, the revised AIFS version demonstrates significant improvements in forecasting skill for total precipitation over its predecessor. The bounding of total precipitation transforms the prediction space such that negative values correspond to “no-rain” and positive values to “rain”. This separation enables the model to more effectively distinguish between the two scenarios. It removes the pressure to forecast exactly zero and facilitates the classification task inherent to precipitation forecasting.</p>
      <p id="d2e2377">Other factors that might improve the precipitation forecast skill in the revised AIFS version are the inclusion of additional variables, the improved learning rate scheduling for rollout fine-tuning and the expansion of the training dataset. To isolate the effect of the bounding mechanism, we retrained the revised AIFS version using the exact same training configuration and data extent, with the sole exception of omitting the bounding layer for total precipitation. This controlled baseline, hereafter referred to as “AIFS revised no-bounding”, allows for a direct comparison between the two models. The SEEPS skill score for the June-July-August 2023 season is shown in Fig. <xref ref-type="fig" rid="F13"/>. The results show that the improvement observed in total precipitation forecast skill in the revised AIFS version can mainly be attributed to constraining the output, since the revised AIFS version without bounding performs similarly to the previous AIFS version.</p>

      <fig id="F13" specific-use="star"><label>Figure 13</label><caption><p id="d2e2384">SEEPS skill scores for 2023 JJA comparing revised AIFS (blue), revised AIFS without bounding (black), previous AIFS (orange), and IFS (red) across different regions. The improvement observed in total precipitation forecast skill in the revised AIFS version can mainly be attributed to bounding the output of the model.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f13.png"/>

        </fig>

      <p id="d2e2394">The physical consistency of convective precipitation forecast with respect to total precipitation can also be evaluated for a given forecast to assess the utility of the FractionBounding strategy used. Figure <xref ref-type="fig" rid="F14"/> presents the 24 h total and convective precipitation accumulation together with a map showing the difference between the two for a forecast issued at 1 June 2023 00:00 UTC and valid at 2 June 2023 00:00 UTC. Unlike the previous AIFS version (Fig. <xref ref-type="fig" rid="F4"/>), the convective precipitation forecast is now consistent with the predicted total precipitation accumulation.</p>

      <fig id="F14" specific-use="star"><label>Figure 14</label><caption><p id="d2e2403">Comparison of 24 h total and convective precipitation accumulation forecast from the revised AIFS version, together with a map showing the difference between the two of them for the forecast issued at 1 June 2023 00:00 UTC and valid at 2 June 2023 00:00 UTC. Unlike the previous AIFS version (Fig. <xref ref-type="fig" rid="F4"/>), the convective precipitation forecast is now consistent with the predicted total precipitation accumulation and no coloured regions (cp <inline-formula><mml:math id="M68" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> tp) appear in the difference plot.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f14.png"/>

        </fig>

      <fig id="F15" specific-use="star"><label>Figure 15</label><caption><p id="d2e2423">Comparison of 6 h total precipitation from previous AIFS, revised AIFS without the final ReLU layer to show the negative space, and the standard revised AIFS with the final ReLU layer. Forecasts are initialised at 1 June 2023 00:00 UTC and valid at 1 June 2023 06:00 UTC. Removing the final bounding layer from the AIFS revised model reveals the behaviour of the negative space for the total precipitation variable. The model has implicitly learned to use the negative space as a proxy for “no-rain” classification.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f15.png"/>

        </fig>

      <p id="d2e2432">To better understand the mechanisms governing total precipitation forecasts in the revised AIFS configuration, we examine the model's behaviour in the negative pre-activation space obtained by removing the final ReLU layer at inference. Figure <xref ref-type="fig" rid="F15"/> reveals that this nominally hidden negative space is neither random nor noisy, but highly structured.</p>
      <p id="d2e2437">At first glance, bounding an output variable with a ReLU activation may appear to introduce a drawback: the negative pre-activation space is not directly penalized, since all negative values are projected to zero before the loss is evaluated. In principle, changes within this region do not influence the weight updates. One might therefore expect the negative space to be uninformative or unstable.</p>
      <p id="d2e2441">Instead, we observe a coherent and physically meaningful organization. Persistently dry regions, such as the Sahara Desert, exhibit strongly negative pre-activations, while areas approaching precipitation events transition smoothly toward zero. The model has therefore learned to encode dryness in the negative space, effectively using it as a latent representation of the “no-rain” regime.</p>
      <p id="d2e2444">This observation motivates two fundamental questions: <list list-type="custom"><list-item><label>i.</label>
      <p id="d2e2449">why does the negative pre-activation space contain coherent and physically meaningful structure, and </p></list-item><list-item><label>ii.</label>
      <p id="d2e2454">why does enforcing a non-negativity constraint during training improve light-precipitation skill?</p></list-item></list> We argue that the first arises from the shared latent representation of the atmospheric state learned by the network, while the second is governed by the symmetry properties of the MSE gradient near the zero-precipitation boundary.</p>
<sec id="Ch1.S4.SS1.SSS1">
  <label>4.1.1</label><title>Representation of dry states in the negative space</title>
      <p id="d2e2466">In this study we argue that the structure present in the negative space is an emergent feature arising from the shared representation of atmospheric states.</p>
      <p id="d2e2469">The model encodes input prognostic (<inline-formula><mml:math id="M69" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) and forcing variables (<inline-formula><mml:math id="M70" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">F</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) into a high-dimensional latent space (<inline-formula><mml:math id="M71" display="inline"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) via an encoder:

              <disp-formula id="Ch1.E3" content-type="numbered"><label>3</label><mml:math id="M72" display="block"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mi mathvariant="normal">Encoder</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi mathvariant="bold">F</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>

            This latent state is evolved to the next time-step through the processor (e.g., via attention-based computations):

              <disp-formula id="Ch1.E4" content-type="numbered"><label>4</label><mml:math id="M73" display="block"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi mathvariant="script">F</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:mrow></mml:math></disp-formula>

            and is then decoded back into the physical space to obtain the forecast at <inline-formula><mml:math id="M74" display="inline"><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:math></inline-formula> of prognostic (<inline-formula><mml:math id="M75" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>) and diagnostic (<inline-formula><mml:math id="M76" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">D</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>) variables. It is worth mentioning here that <inline-formula><mml:math id="M77" display="inline"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> encodes the physical state of all the prognostic variables in a shared representation space and the diagnostic variables are decoded from it. The diagnostic precipitation output is thus produced by a specific decoder head:

              <disp-formula id="Ch1.E5" content-type="numbered"><label>5</label><mml:math id="M78" display="block"><mml:mrow><mml:msub><mml:mi mathvariant="italic">η</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi mathvariant="normal">Decoder</mml:mi><mml:mi mathvariant="normal">tp</mml:mi></mml:msub><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:mfenced></mml:mrow></mml:math></disp-formula>

            where <inline-formula><mml:math id="M79" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> represents the pre-activation total precipitation. The final physical output is obtained via the bounding layer:

              <disp-formula id="Ch1.E6" content-type="numbered"><label>6</label><mml:math id="M80" display="block"><mml:mrow><mml:msub><mml:mi mathvariant="normal">tp</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi mathvariant="normal">ReLU</mml:mi><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi mathvariant="italic">η</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mi mathvariant="normal">max</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mi mathvariant="italic">η</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d2e2720">Because Decoder<sub>tp</sub> maps from a latent space optimized for smooth gradients (<inline-formula><mml:math id="M82" display="inline"><mml:mrow><mml:msub><mml:mi>z</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>), <inline-formula><mml:math id="M83" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> inherits this spatial structure. The precipitation decoder head learns a smooth mapping from the latent space encoding the moisture state of the system to physical precipitation in the positive regime (<inline-formula><mml:math id="M84" display="inline"><mml:mrow><mml:mi mathvariant="italic">η</mml:mi><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>), where gradients are active. Because neural networks are continuous functions biased toward smoothness, this “moisture-to-precipitation” logic naturally extrapolates into the negative regime. As moisture variables decrease, the decoder continues to output decreasing values, pushing <inline-formula><mml:math id="M85" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> into the negative space.</p>
      <p id="d2e2774">While the precipitation head receives no direct gradients when <inline-formula><mml:math id="M86" display="inline"><mml:mrow><mml:mi mathvariant="italic">η</mml:mi><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>, the latent variables that serve as its input are not static. These latent features are shared with prognostic variables (e.g., specific humidity <inline-formula><mml:math id="M87" display="inline"><mml:mi>q</mml:mi></mml:math></inline-formula>, total water content tcw, etc.) and receive continuous gradient information from their respective loss functions. Consequently, the negative space of the tp field is “indirectly learned”; it is a projection of a latent space that is being rigorously optimized.</p>
      <p id="d2e2797">Ultimately, this reveals that the optimization of the shared latent space is driven by the collective constraints of all output variables. In this framework, the negative pre-activation space for precipitation serves as a “saturation deficit” proxy that is kept physically consistent by the gradients flowing from prognostic moisture fields. The shared representation of the atmosphere in the latent space allows the model to maintain a sophisticated, structured representation of dryness even in the absence of direct precipitation gradients.</p>
      <p id="d2e2800">To provide empirical weight to this mechanistic theory, we investigate the information content within the pre-activation space <inline-formula><mml:math id="M88" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> by partitioning the model output into three distinct physical regimes: the negative (non-precipitating) space, the light precipitation regime (0–0.5 mm per 6 h), and the moderate precipitation regime (0.5–10 mm per 6 h).</p>
      <p id="d2e2810">We hypothesize that the pre-activation space <inline-formula><mml:math id="M89" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> undergoes a fundamental physical decoupling as it transitions from dry to wet conditions. In the negative (non-precipitating) regime, the absence of precipitation is a deterministic function of low humidity; thus, the decoder should preserve a strong linear mapping from the prognostic moisture fields.</p>
      <p id="d2e2820">Conversely, we expect this linear correlation to weaken in the light precipitation regime (<inline-formula><mml:math id="M90" display="inline"><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">η</mml:mi><mml:mo>≤</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula> mm). While moisture remains a necessary condition for rain, the exact accumulation at these low intensities becomes increasingly stochastic, influenced by non-linear factors such as sub-grid scale turbulence, cloud-base evaporation, and microphysical uncertainties. These processes act as “interference”, decoupling the surface precipitation from the column moisture signal.</p>
      <p id="d2e2839">We performed a global correlation analysis on a single forecast issued at 1 June 2023 00:00 UTC. For this experiment, we utilize the AIFS revised model without the final bounding layer on tp during inference, but activated during training. We focus our analysis on the first 120 h (5 d) of the forecast.</p>

      <fig id="F16" specific-use="star"><label>Figure 16</label><caption><p id="d2e2845">Regime-dependent correlations of pre-activation <inline-formula><mml:math id="M91" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> (AIFS Revised), for a forecast issued on 1 June 2023 at 00:00 UTC. Pearson <inline-formula><mml:math id="M92" display="inline"><mml:mi>r</mml:mi></mml:math></inline-formula> between <inline-formula><mml:math id="M93" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> and physical drivers across three regimes: negative space (<inline-formula><mml:math id="M94" display="inline"><mml:mrow><mml:mi mathvariant="italic">η</mml:mi><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>): high correlation with moisture variables (<inline-formula><mml:math id="M95" display="inline"><mml:mrow><mml:msub><mml:mi>q</mml:mi><mml:mn mathvariant="normal">1000</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, TCW) identifies <inline-formula><mml:math id="M96" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> as a structured saturation deficit proxy (left panel). Light rain (<inline-formula><mml:math id="M97" display="inline"><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">η</mml:mi><mml:mo>≤</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula> mm per 6 h): systematic weakening of correlation, likely associated with enhanced stochasticity in this regime (center panel). 
Moderate rain (<inline-formula><mml:math id="M98" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">η</mml:mi><mml:mo>≤</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> mm per 6 h): transition to dynamic control, with vertical velocity (<inline-formula><mml:math id="M99" display="inline"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mn mathvariant="normal">500</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>) as the dominant predictor (<inline-formula><mml:math id="M100" display="inline"><mml:mrow><mml:mi>r</mml:mi><mml:mo>≈</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula>) (right panel). Analysis covers a 120 h global forecast.</p></caption>
            <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f16.png"/>

          </fig>

      <p id="d2e2963">We computed the Pearson correlation coefficient (<inline-formula><mml:math id="M101" display="inline"><mml:mi>r</mml:mi></mml:math></inline-formula>) between the pre-activation field <inline-formula><mml:math id="M102" display="inline"><mml:mi mathvariant="italic">η</mml:mi></mml:math></inline-formula> and five key physical drivers: Total Column Water (TCW), Specific Humidity (<inline-formula><mml:math id="M103" display="inline"><mml:mrow><mml:msub><mml:mi>q</mml:mi><mml:mn mathvariant="normal">1000</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>), 2 m Dewpoint (<inline-formula><mml:math id="M104" display="inline"><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>d</mml:mi></mml:mrow></mml:math></inline-formula>), Mean Sea Level Pressure (MSLP), and mid-tropospheric Vertical Velocity (<inline-formula><mml:math id="M105" display="inline"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mn mathvariant="normal">500</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>). As shown in Fig. <xref ref-type="fig" rid="F16"/>, the results reveal a clear regime-dependent physical logic: <list list-type="bullet"><list-item>
      <p id="d2e3017"><italic>Negative regime</italic> (<inline-formula><mml:math id="M106" display="inline"><mml:mrow><mml:mi mathvariant="italic">η</mml:mi><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>): we observe stable correlations (<inline-formula><mml:math id="M107" display="inline"><mml:mrow><mml:mi>r</mml:mi><mml:mo>≈</mml:mo><mml:mn mathvariant="normal">0.3</mml:mn></mml:mrow></mml:math></inline-formula>) with moisture variables (<inline-formula><mml:math id="M108" display="inline"><mml:mrow><mml:msub><mml:mi>q</mml:mi><mml:mn mathvariant="normal">1000</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, TCW, and <inline-formula><mml:math id="M109" display="inline"><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>d</mml:mi></mml:mrow></mml:math></inline-formula>). This confirms that the negative space encodes a structured representation of the <italic>saturation deficit</italic>, kept physically consistent by gradients flowing from the prognostic moisture fields.</p></list-item><list-item>
      <p id="d2e3071"><italic>Light precipitation</italic> (<inline-formula><mml:math id="M110" display="inline"><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">η</mml:mi><mml:mo>≤</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula> mm): correlation with specific humidity, 2 m dewpoint and total column water is substantially reduced in this regime. The weaker relationships are consistent with a lower signal-to-noise ratio and increased sensitivity to small-scale or non-linear processes.</p></list-item><list-item>
      <p id="d2e3093"><italic>Moderate precipitation</italic> (<inline-formula><mml:math id="M111" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">η</mml:mi><mml:mo>≤</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> mm): the model transitions to dynamic control. While moisture correlations remain moderate, Vertical Velocity (<inline-formula><mml:math id="M112" display="inline"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mn mathvariant="normal">500</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>) emerges as the primary physical driver (<inline-formula><mml:math id="M113" display="inline"><mml:mrow><mml:mi>r</mml:mi><mml:mo>≈</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.5</mml:mn></mml:mrow></mml:math></inline-formula>), illustrating the model's reliance on large-scale ascent to produce deterministic rainfall.</p></list-item></list></p>
      <p id="d2e3139">While presented as a targeted demonstration of internal model behaviour, the consistency of these signals across lead times suggests that this regime-specific transition is a fundamental structural property of the AIFS architecture. These results demonstrate that the negative pre-activation field encodes valuable information regarding a proxy for saturation deficit. We acknowledge that these correlations are computed from a single 5 d forecast, which limits the temporal sampling. However, the analysis is performed on a Gaussian reduced N320 grid, such that each 6-hourly forecast field contains more than 500 000 spatial evaluation points. Although based on one forecast initialization, the large number of grid-point samples per lead time provides a substantial statistical basis for examining the internal behaviour of the model.</p>
</sec>
<sec id="Ch1.S4.SS1.SSS2">
  <label>4.1.2</label><title>Optimization geometry at the zero-precipitation boundary</title>
      <p id="d2e3150">Having established that the negative pre-activation space encodes physically meaningful information, we now turn to understanding why constraining it during training improves forecast skill for light precipitation. The mechanism can be understood by examining how the Mean Squared Error (MSE) interacts with model outputs in the vicinity of the zero-precipitation boundary for a non-bounded model: <list list-type="order"><list-item>
      <p id="d2e3155"><italic>Scenario A (Non-physical negative dry prediction)</italic>: the model predicts a non-physical negative value (<inline-formula><mml:math id="M114" display="inline"><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.2</mml:mn></mml:mrow></mml:math></inline-formula> mm) for a dry observation (tp<inline-formula><mml:math id="M115" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mi mathvariant="normal">obs</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula> mm). The gradient of the Mean Squared Error (MSE) is:<disp-formula id="Ch1.E7" content-type="numbered"><label>7</label><mml:math id="M116" display="block"><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="normal">tp</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mfenced close=")" open="("><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="normal">tp</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mo>(</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.2</mml:mn><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0</mml:mn><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.4</mml:mn><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Push</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="normal">Up</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p></list-item><list-item>
      <p id="d2e3259"><italic>Scenario B (Underprediction)</italic>: the truth is light rain (tp<inline-formula><mml:math id="M117" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mi mathvariant="normal">obs</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.45</mml:mn></mml:mrow></mml:math></inline-formula> mm), but the model under-predicts the intensity (<inline-formula><mml:math id="M118" display="inline"><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.25</mml:mn></mml:mrow></mml:math></inline-formula> mm). The gradient is:<disp-formula id="Ch1.E8" content-type="numbered"><label>8</label><mml:math id="M119" display="block"><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="normal">tp</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mo>(</mml:mo><mml:mn mathvariant="normal">0.25</mml:mn><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.45</mml:mn><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.4</mml:mn><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Push</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="normal">Up</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p></list-item><list-item>
      <p id="d2e3341"><italic>Scenario C (Overprediction)</italic>: the truth is dry or very light rain (tp<inline-formula><mml:math id="M120" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mi mathvariant="normal">obs</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.05</mml:mn></mml:mrow></mml:math></inline-formula> mm), but the model over-predicts the intensity (<inline-formula><mml:math id="M121" display="inline"><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.25</mml:mn></mml:mrow></mml:math></inline-formula> mm). The gradient is:<disp-formula id="Ch1.E9" content-type="numbered"><label>9</label><mml:math id="M122" display="block"><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="normal">tp</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mo>(</mml:mo><mml:mn mathvariant="normal">0.25</mml:mn><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.05</mml:mn><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mo>+</mml:mo><mml:mn mathvariant="normal">0.4</mml:mn><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Push</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi mathvariant="normal">Down</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p></list-item></list></p>
      <p id="d2e3422">Because non-physical negative dry predictions (Scenario A) and genuine drizzle underpredictions (Scenario B) produce identical upward gradients, the optimizer receives an ambiguous training signal in the vicinity of zero. The loss provides no information about why the correction is required – whether it reflects a physical regime transition (dry <inline-formula><mml:math id="M123" display="inline"><mml:mo>→</mml:mo></mml:math></inline-formula> drizzle) or merely a violation of the non-negativity constraint. One might expect the model to self-organize by  learning to place dry predictions in a compact negative range – say, around <inline-formula><mml:math id="M124" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.1</mml:mn></mml:mrow></mml:math></inline-formula> mm – thereby avoiding interference with the light-rain regime. However, this equilibrium is dynamically unstable under MSE. A dry prediction at <inline-formula><mml:math id="M125" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.1</mml:mn></mml:mrow></mml:math></inline-formula> mm receives the same upward gradient as a genuine drizzle underprediction, so stochastic gradient updates continually push dry samples toward and across zero. As a result, no stable attractor can form in the negative space.</p>
      <p id="d2e3452">Importantly, the instability is locally asymmetric around <inline-formula><mml:math id="M126" display="inline"><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>. For small <inline-formula><mml:math id="M127" display="inline"><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="italic">ϵ</mml:mi></mml:mrow></mml:math></inline-formula> (with <inline-formula><mml:math id="M128" display="inline"><mml:mrow><mml:mo>|</mml:mo><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mo>|</mml:mo><mml:mo>≪</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula>),

              <disp-formula id="Ch1.Ex2"><mml:math id="M129" display="block"><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="normal">tp</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mfenced close=")" open="("><mml:mrow><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="normal">tp</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>

            In the neighbourhood of zero, the target distribution is one-sided: <inline-formula><mml:math id="M130" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">tp</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub><mml:mo>≥</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>, with strictly positive drizzle values arbitrarily close to zero but no negative observations. Let

              <disp-formula id="Ch1.Ex3"><mml:math id="M131" display="block"><mml:mrow><mml:mi mathvariant="italic">μ</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="double-struck">E</mml:mi><mml:mfenced open="[" close="]"><mml:mrow><mml:msub><mml:mi mathvariant="normal">tp</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub><mml:mo>∣</mml:mo><mml:msub><mml:mi mathvariant="normal">tp</mml:mi><mml:mi mathvariant="normal">obs</mml:mi></mml:msub><mml:mo>≈</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:mfenced><mml:mo>,</mml:mo><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi mathvariant="normal">with</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="italic">μ</mml:mi><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>

            Then

              <disp-formula id="Ch1.Ex4"><mml:math id="M132" display="block"><mml:mrow><mml:mi mathvariant="double-struck">E</mml:mi><mml:mfenced close="]" open="["><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="script">L</mml:mi></mml:mrow><mml:mrow><mml:mo>∂</mml:mo><mml:mi mathvariant="normal">tp</mml:mi></mml:mrow></mml:mfrac></mml:mstyle></mml:mfenced><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn><mml:mo>(</mml:mo><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mo>-</mml:mo><mml:mi mathvariant="italic">μ</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>

            Hence the expected gradient is negative for all <inline-formula><mml:math id="M133" display="inline"><mml:mrow><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">μ</mml:mi></mml:mrow></mml:math></inline-formula>, including the negative space. The only stationary point of the expected dynamics is <inline-formula><mml:math id="M134" display="inline"><mml:mrow><mml:mi mathvariant="italic">ϵ</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="italic">μ</mml:mi><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>, which lies strictly on the positive side. Zero is therefore not a locally stable fixed point under MSE; stochastic gradient updates induce a systematic drift that transports dry predictions across the boundary into weakly positive values.</p>
      <p id="d2e3654">As a consequence, dry predictions do not concentrate at a stable negative value but instead occupy a diffuse region centered on zero, extending into both the negative and weakly positive ranges. The interval just above zero therefore contains a superposition of displaced dry cases and genuine drizzle events. This overlap reduces representational separability and compresses the effective dynamic range available to encode variability within the light-precipitation regime.</p>
      <p id="d2e3658">By enforcing non-negativity through a ReLU constraint during training, negative pre-activations are projected to zero before loss evaluation. As a result, dry samples no longer generate corrective gradients within the negative space. Zero becomes a hard boundary rather than a distributional equilibrium, and the dry regime collapses deterministically onto this boundary point. The positive axis is therefore freed to encode light-rain variability without contamination from non-physical corrective gradients.</p>
      <p id="d2e3661">Figure <xref ref-type="fig" rid="F17"/> allows the gradient-ambiguity argument to be verified quantitatively. The three panels form a closed chain of evidence. The non-bounded model produces dry or negative outputs at only <inline-formula><mml:math id="M135" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> % of grid points, compared to <inline-formula><mml:math id="M136" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">30</mml:mn></mml:mrow></mml:math></inline-formula> % for the bounded model. The top-right panel shows that the non-bounded model's light-precipitation frequency is inflated by almost exactly the same <inline-formula><mml:math id="M137" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">20</mml:mn></mml:mrow></mml:math></inline-formula> percentage points. The non-bounded model is not detecting  more drizzle; it is misclassifying displaced dry events as light rain. The bottom panel reveals the mechanism predicted by the expected-gradient analysis. The non-bounded model produces a narrow spike of density straddling zero, within which the dry and drizzle regimes are superimposed and statistically indistinguishable. The distribution is tightly concentrated near zero but exhibits a slight positive skew, consistent with the theoretical result that the local stationary point of the expected MSE gradient lies at a strictly positive value. 
In other words, the model attempts to encode dry states in the neighbourhood of zero, yet the systematic upward drift induced by <inline-formula><mml:math id="M138" display="inline"><mml:mrow><mml:mi mathvariant="double-struck">E</mml:mi><mml:mo>[</mml:mo><mml:mo>∂</mml:mo><mml:mi mathvariant="script">L</mml:mi><mml:mo>/</mml:mo><mml:mo>∂</mml:mo><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>]</mml:mo><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula> for <inline-formula><mml:math id="M139" display="inline"><mml:mrow><mml:mi mathvariant="normal">tp</mml:mi><mml:mo>&lt;</mml:mo><mml:mi mathvariant="italic">μ</mml:mi></mml:mrow></mml:math></inline-formula> prevents zero from acting as a stable attractor. The consequence is a persistent displacement of dry samples into weakly positive values, producing the observed excess of light precipitation.</p>

      <fig id="F17" specific-use="star"><label>Figure 17</label><caption><p id="d2e3737">Output distribution and discriminative capacity in the light-precipitation regime for bounded and non-bounded AIFS. The bounded model's ReLU is removed at inference to expose raw pre-activations. Top left panel: the non-bounded model produces dry or negative outputs at only <inline-formula><mml:math id="M140" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> % of grid points versus <inline-formula><mml:math id="M141" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">30</mml:mn></mml:mrow></mml:math></inline-formula> % for the bounded model, a persistent 20-percentage-point gap across all lead times. Top right panel: the non-bounded model assigns <inline-formula><mml:math id="M142" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">60</mml:mn></mml:mrow></mml:math></inline-formula> % of grid points to the light-precipitation bin (0–0.5 mm per 6 h) versus <inline-formula><mml:math id="M143" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">40</mml:mn></mml:mrow></mml:math></inline-formula> % for the bounded model, an excess whose magnitude mirrors the dry-detection deficit almost exactly. Bottom panel: pre-activation density near zero. The non-bounded model concentrates dry and drizzle cases in an indistinguishable spike around zero; the bounded model distributes dry-state density broadly across the negative space, with 31 % of pre-activations collapsing cleanly to zero under ReLU at inference.</p></caption>
            <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f17.png"/>

          </fig>

      <p id="d2e3786">Although Fig. <xref ref-type="fig" rid="F17"/> illustrates a single 5 d forecast, the behavior is systematic rather than case-specific. This interpretation is reinforced by the Frequency Bias Index (FBI) and Peirce Skill Score (PSS) shown in Fig. <xref ref-type="fig" rid="F3"/> of the main article. The non-bounded configuration exhibits a pronounced positive frequency bias in the light-precipitation category, together with degraded discrimination skill, consistent with systematic misclassification of dry grid points as drizzle.</p>
      <p id="d2e3793">The mechanism described here provides a refined interpretation of recent findings in AI-driven precipitation forecasting. <xref ref-type="bibr" rid="bib1.bibx32" id="text.33"/> reported that drizzle bias is substantially reduced when physical constraints are applied, whereas terrain-following coordinates alone do not mitigate drizzle bias but instead improve extreme precipitation forecasts. Notably, their constraint framework combines global conservation principles with an explicit non-negativity correction.</p>
      <p id="d2e3800">The present analysis isolates the role of non-negativity enforcement and demonstrates that it addresses a fundamental gradient asymmetry at the zero-precipitation boundary. This mechanism operates at the level of local optimization dynamics and provides a distinct, mechanistically interpretable pathway for drizzle reduction. While <xref ref-type="bibr" rid="bib1.bibx32" id="text.34"/> demonstrate the effectiveness of combining non-negativity with global conservation constraints, our analysis suggests that non-negativity merits investigation as an independent design element. The relative contributions of boundary enforcement versus conservation-based regularization, and their potential architecture dependence, remain important questions for future work.</p>
</sec>
</sec>
<sec id="Ch1.S4.SS2">
  <label>4.2</label><title>Case studies</title>
      <p id="d2e3815">Headline verification scores for the revised AIFS show significant improvements over the conventional numerical weather prediction model. However, building trust in AI forecasting requires more than strong overall metrics. Forecasters place great importance on the ability of the model to accurately and reliably predict weather phenomena. They also value physically plausible outputs and recognizable weather patterns. To support this, we show below selected case studies.</p>
<sec id="Ch1.S4.SS2.SSS1">
  <label>4.2.1</label><title>Storm Éowyn</title>
      <p id="d2e3826">Storm Éowyn was an unusually strong winter storm and blizzard, initially impacting much of the Gulf Coast of the United States between 20 and 22 January 2025. This storm broke snowfall records at a number of reporting stations <xref ref-type="bibr" rid="bib1.bibx35" id="paren.35"/> and represented an extreme out-of-training-distribution event with no clear analogies in the ERA5 reanalysis or the IFS Operational analysis dataset.</p>
      <p id="d2e3832">Figure <xref ref-type="fig" rid="F18"/> shows the AIFS and IFS forecasts at decreasing lead times for the affected area versus the corresponding IFS short-range forecast. The AIFS delivers an accurate forecast of snowfall for this extremely rare event. This showcases the ability of the model to accurately interpret meteorological patterns and forecast physically plausible events, even if they are far from the training data. The AIFS predicted the event with a lead time of 10 d, earlier than the IFS.</p>

      <fig id="F18" specific-use="star"><label>Figure 18</label><caption><p id="d2e3839">Snowfall forecasts for AIFS (top row panels) and IFS (middle row panels) over the Gulf Coast of America at 10, 8, 6 and 4 d lead times from left to right respectively, against IFS short-range forecasts for the snowfall event (bottom row panels). The figure shows how the snowfall event was forecast accurately 4 d ahead by both the IFS and AIFS. The AIFS forecasted the event even 10 d ahead.</p></caption>
            <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f18.png"/>

          </fig>

</sec>
<sec id="Ch1.S4.SS2.SSS2">
  <label>4.2.2</label><title>Tropical low and extreme precipitation totals in Queensland, Australia</title>
      <p id="d2e3856">Starting in late January 2025, a slow-moving summer storm brought exceptional rainfall along the northeastern coast of Queensland, Australia. Within a week, rainfall accumulation totalled more than 1000 mm in some areas, according to the Bureau of Meteorology as reported in <xref ref-type="bibr" rid="bib1.bibx25" id="text.36"/>. The city of Townsville saw the equivalent of six months of rain in just 3 d and the largest weekly rainfall total was measured at a gauge in the Cardwell Range, southwest of Tully, where nearly 1700 mm fell (<xref ref-type="bibr" rid="bib1.bibx25" id="altparen.37"/>, Bureau of Meteorology measurements). Figure <xref ref-type="fig" rid="F19"/> compares forecasts from AIFS and IFS against the IMERG <xref ref-type="bibr" rid="bib1.bibx15" id="paren.38"/> final product for the period 1–3 February 2025. Both model forecasts were initialized on 30 January 2025, 2 d prior to the event. The Cardwell Range is indicated by a black star, and the city of Townsville by a cyan star. Both IFS and AIFS successfully captured the event, with 24 h rainfall accumulations exceeding 300 mm in some regions. However, the AIFS forecast exhibits a somewhat persistent signal in the 5 d lead time, predicting very high rainfall totals near the Cardwell Range. This highlights that, despite AIFS's tendency toward excessive spatial smoothing, it remains capable of accurately forecasting extreme events at medium range.</p>

      <fig id="F19" specific-use="star"><label>Figure 19</label><caption><p id="d2e3872">24 h accumulated precipitation forecasts from the AIFS (top row panels) and IFS (middle row panels) models, compared with IMERG observational data (bottom row panels) over northeastern Queensland for 1 to 3 February 2025. Forecasts are initialised on 30 January 2025. The black star marks the Cardwell Range, where rainfall totals exceeded 1600 mm over the week, and the cyan star marks the city of Townsville. Both models captured the core of the extreme rainfall event, with accumulations exceeding 300 mm in 24 h in some areas.</p></caption>
            <graphic xlink:href="https://gmd.copernicus.org/articles/19/4703/2026/gmd-19-4703-2026-f19.jpg"/>

          </fig>

</sec>
</sec>
</sec>
<sec id="Ch1.S5" sec-type="conclusions">
  <label>5</label><title>Discussion and conclusion</title>
      <p id="d2e3892">The revised AIFS version (1.1.0) presented here improves upon the pre-operational release through a revised training regime with more data, new forecast variables, improved stratospheric loss weights, and a bounding strategy that enforces physical constraints on the output variables. Overall, this leads to improvements of around 4 %–6 % across all variables, lead times, and pressure levels. The largest improvements, up to 12 % gains in normalized difference in the short range,  are observed in total precipitation forecasting, which benefits from the newly introduced bounding. We showed that this has a significant impact on the prediction of no rain and light precipitation. The model displays good forecast performance for out-of-training-sample case studies, accurately capturing extreme precipitation and snowfall events.</p>
      <p id="d2e3895">Data plays a crucial role in the performance of AI models. Most of the improvements unrelated to precipitation in the revised version of the AIFS stem from the expansion of the training dataset and the use of more recent operational ECMWF analyses for rollout fine-tuning, as demonstrated by the controlled comparison in Fig. <xref ref-type="fig" rid="F5"/>. Since the AIFS relies on these analyses for real-time forecasting, it is important to fine-tune the model regularly using up-to-date data. Regular fine-tuning with recent ECMWF analyses helps the models to adapt to shifts in the data due to new IFS model cycles.</p>
      <p id="d2e3900">Recent global AI forecasting systems, including GraphCast, Pangu-Weather, FuXi, and CREDIT, have reported persistent challenges in representing light precipitation. Positive frequency bias in the drizzle regime appears to be a recurring feature across models trained with symmetric regression losses on strictly non-negative, intermittent variables. Although these systems differ substantially in backbone architecture, from graph neural networks to transformer-based designs and modular physically constrained frameworks, the drizzle problem appears largely independent of architecture. Instead, it is closely tied to how precipitation is parameterized and constrained during training. Physical constraint methodologies offer multiple pathways for mitigating precipitation biases. Global conservation schemes may reduce drizzle indirectly by regulating total moisture budgets. The present analysis suggests that non-negativity enforcement addresses a more fundamental issue: the local gradient asymmetry at the zero boundary and the superposition of dry and wet states around zero. By introducing a hard geometric boundary at zero, the optimization  landscape is reshaped such that dry and wet regimes become separable. This mechanism operates independently of large-scale conservation principles and may therefore represent a structural requirement for stable training of intermittent variables under MSE. 
Alternative activation functions such as LeakyReLU, which scale negative inputs by a small factor <inline-formula><mml:math id="M144" display="inline"><mml:mi mathvariant="italic">α</mml:mi></mml:math></inline-formula> (typically 0.01), would permit gradient flow in the negative space while heavily attenuating the loss contribution from dry predictions (by a factor of <inline-formula><mml:math id="M145" display="inline"><mml:mrow><mml:msup><mml:mi mathvariant="italic">α</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>). We expect that similar regime separation would still emerge, since the cost of placing dry states deep in the negative space becomes negligible. The main practical difference is that LeakyReLU produces non-physical slightly negative output values at inference, requiring post-processing clipping. More broadly, alternative formulations that explicitly decouple the dry and wet regimes during training, such as asymmetric loss functions or dedicated classification heads for the no-rain state, represent promising directions for future work.</p>
      <p id="d2e3921">The bounding strategy presented here enforces physical realizability, non-negativity, boundedness, and inter-variable consistency, but does not impose global conservation of mass or energy. For the medium-range timescales considered in this work (up to 10 d), we expect conservation violations to remain small relative to forecast errors dominated by chaotic error growth, though a systematic quantification of mass and energy drift over extended AIFS integrations remains to be carried out.</p>
      <p id="d2e3925">Rollout fine-tuning emerges as an important factor shaping forecast behaviour, including the degree of spatial smoothing in the outputs. As the model is trained on extended lead times and optimised using a mean squared error objective, some degree of smoothing is expected. Training hyperparameters such as learning rate scheduling, number of optimisation steps, and rollout configuration can influence this behaviour and warrant further systematic investigation. In the present study, the training configuration, including a maximum rollout length of 12, was retained from the previous AIFS version to ensure consistency. The resulting Z500 power spectra (Fig. <xref ref-type="fig" rid="F6"/>) are broadly comparable to those of the previous model across scales, including the <inline-formula><mml:math id="M146" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">500</mml:mn></mml:mrow></mml:math></inline-formula> km range, with slightly improved agreement with the analysis at longer lead times. Importantly, these comparable spectral characteristics are achieved alongside overall improvements in RMSE-based skill (Fig. <xref ref-type="fig" rid="F7"/>). This indicates that the skill gains are not obtained at the expense of degraded spatial variability. While more aggressive rollout strategies may further optimise headline verification scores, understanding their impact on spatial characteristics remains an important area for future work.</p>
      <p id="d2e3942">Alongside making updates to the training schedule, we have also added new variables to the AIFS while achieving improvements in forecast skill for headline atmospheric metrics. In particular, the inclusion of soil moisture and soil temperature as prognostic variables represents an initial step toward a more complete Earth-system representation within AIFS. Targeted ablation studies are planned as the land-surface component is extended in future versions. However, it remains to be seen if adding more variables and Earth-system components will eventually require an increase to the latent space of the model. The additional Earth-system and energy-sector variables in AIFS establish a foundation for future extensions, including ocean and wave components, expanding the number of cryospheric processes with enhanced snow modelling, and increasing the hydrological capabilities of the model. These new variables are currently taken from a data source consistent with the rest of the model variables. In the future, there is the potential to look at datasets tailored to specific Earth-system components, such as ERA5-Land <xref ref-type="bibr" rid="bib1.bibx24" id="paren.39"/> and the ocean and sea-ice reanalysis system (ORAS6) <xref ref-type="bibr" rid="bib1.bibx39" id="paren.40"/>.</p>
      <p id="d2e3951">AIFS currently operates at approximately 0.25° spatial resolution with a 6 h timestep, and future work will focus on increasing both spatial and temporal resolution.</p>
      <p id="d2e3954">The AIFS development has now transitioned to the new Anemoi framework <xref ref-type="bibr" rid="bib1.bibx20 bib1.bibx26 bib1.bibx37" id="paren.41"/>. Anemoi provides tools for the whole data-driven modelling workflow, from the generation of training datasets, to scalable probabilistic training <xref ref-type="bibr" rid="bib1.bibx21" id="paren.42"/> and running real-time inference with such models. Anemoi also allows for the cataloguing and archiving of model and data checkpoints to ensure reproducibility and traceability of training and inference runs and ensure that any models developed within this framework have a clear lineage. The Anemoi framework is now being used by an increasing number of Member States of ECMWF and collaborating organisations supported by ECMWF.</p>
      <p id="d2e3963">After a successful experimental phase, AIFS transitioned to operational status at ECMWF on 25 February 2025. It is supported 24/7 alongside ECMWF's physics-based system, the IFS. The MSE-trained model is labeled AIFS Single, and its forecasts are available earlier than the ones from the physics-based model chain, due to the fast runtime of AIFS.</p>
      <p id="d2e3966">Results presented in this paper show that AIFS forecasts are highly skilful and outperform the IFS forecasts across the vast majority of lead times and variables. These results highlight the relevance of AIFS for weather prediction. Future developments will focus on including more surface variables and exploring a wider range of applications such as climate reanalysis. The operational release of the AIFS demonstrates the commitment of ECMWF to pursue the best possible weather forecasts with both physics-based and machine learning methods.</p>
      <p id="d2e3971"><italic>Code and model availability.</italic>
<list list-type="bullet"><list-item>
      <p id="d2e3979">AIFS version 1.1.0 was fully trained using the Anemoi framework <uri>https://github.com/ecmwf/anemoi</uri> (last access: 31 March 2026). The frozen versions of the Anemoi modules used for training, together with the configuration files and the trained model checkpoint, are available in the permanent archive <xref ref-type="bibr" rid="bib1.bibx10" id="text.43"/> under <ext-link xlink:href="https://doi.org/10.5281/zenodo.17349820" ext-link-type="DOI">10.5281/zenodo.17349820</ext-link>.</p></list-item><list-item>
      <p id="d2e3992">The model weights for version 1.1.0 are also available on the project page on Hugging Face <uri>https://huggingface.co/ecmwf/aifs-single-1.1</uri> (last access: 31 March 2026) under a Creative Commons Attribution 4.0 International (CC BY 4.0) licence and <ext-link xlink:href="https://doi.org/10.57967/hf/6415" ext-link-type="DOI">10.57967/hf/6415</ext-link> <xref ref-type="bibr" rid="bib1.bibx8" id="paren.44"/>.</p></list-item><list-item>
      <p id="d2e4005">The AIFS Single model operational forecasts are freely available under ECMWF's Open Data Creative Commons licence (<uri>https://www.ecmwf.int/en/forecasts/datasets/open-data</uri>, last access: 31 March 2026) and <ext-link xlink:href="https://doi.org/10.21957/open-data" ext-link-type="DOI">10.21957/open-data</ext-link> <xref ref-type="bibr" rid="bib1.bibx9" id="paren.45"/> and forecast charts can be seen at <uri>https://charts.ecmwf.int/?query=aifs-single</uri> (last access: 31 March 2026).</p></list-item><list-item>
      <p id="d2e4021">Further details on the model’s operationalization and data dissemination can be found at <uri>https://confluence.ecmwf.int/display/USS/OLD+-+Implementation+of+AIFS+Single+v1.0</uri> (last access: 31 March 2026).</p></list-item></list></p>
</sec>

      
      </body>
    <back><notes notes-type="dataavailability"><title>Data availability</title>

      <p id="d2e4031">ERA5 reanalysis data were obtained from the Copernicus Climate Change Service Climate Data Store (<ext-link xlink:href="https://doi.org/10.24381/cds.adbb2d47" ext-link-type="DOI">10.24381/cds.adbb2d47</ext-link>, <xref ref-type="bibr" rid="bib1.bibx14" id="altparen.46"/>). ECMWF operational analyses were retrieved from the ECMWF Forecast Datasets archive (<uri>https://www.ecmwf.int/en/forecasts/datasets</uri>, last access: 31 March 2026).</p>
  </notes><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e4047"><list list-type="bullet">
        <list-item>

      <p id="d2e4052"><italic>Experiment design and execution</italic>: GMo<sup>*</sup>, EP<sup>*</sup>, APN<sup>*</sup>, SL, MCh</p>
        </list-item>
        <list-item>

      <p id="d2e4087"><italic>Model evaluation</italic>: GMo<sup>*</sup>, EP<sup>*</sup>, APN<sup>*</sup>, ZBB<sup>*</sup>, LM, SL, MCh</p>
        </list-item>
        <list-item>

      <p id="d2e4131"><italic>Framework development (Anemoi)</italic>: SL, JD, MCh, MA, APN, MSC, SH, HC, HT, MC, CO, JP, GMe, FP, BR, GMo, EP</p>
        </list-item>
        <list-item>

      <p id="d2e4139"><italic>Manuscript writing</italic>: GMo, EP, SL, APN with input from all co-authors</p>
        </list-item>
      </list><sup>*</sup> Equal Contribution.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e4158">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e4164">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. The authors bear the ultimate responsibility for providing appropriate place names. Views expressed in the text are those of the authors and do not necessarily reflect the views of the publisher.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e4170">We acknowledge PRACE for awarding us access to Leonardo, CINECA, Italy. We acknowledge the EuroHPC Joint Undertaking for awarding this work access to the EuroHPC supercomputer MN5, hosted by BSC in Barcelona through a EuroHPC JU Special Access call.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e4175">Ewan Pinnington's contribution is funded under the CERISE project (grant agreement no. 101082139); CERISE is funded by the European Union. Ana Prieto Nemesio's contribution is partially funded under the RODEO project (grant agreement no. 101100651); RODEO is funded by the European Union. Views and opinions expressed are however those of the author(s) only and do not necessarily reflect those of the European Union or the Commission. Neither the European Union nor the granting authority can be held responsible for them.</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e4181">This paper was edited by Po-Lun Ma and reviewed by three anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bibx1"><label>Balogh et al.(2024)Balogh, Saint-Martin, and Geoffroy</label><mixed-citation>Balogh, B., Saint-Martin, D., and Geoffroy, O.: Online Test of a Neural Network Deep Convection Parameterization in ARP-GEM1, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2410.21920" ext-link-type="DOI">10.48550/arXiv.2410.21920</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx2"><label>Ben Bouallègue et al.(2024)Ben Bouallègue, Clare, Magnusson, Gascón, Maier-Gerber, Janoušek, Rodwell, Pinault, Dramsch, Lang, Raoult, Rabier, Chevallier, Sandu, Dueben, Chantry, and Pappenberger</label><mixed-citation>Ben Bouallègue, Z., Clare, M. C. A., Magnusson, L., Gascón, E., Maier-Gerber, M., Janoušek, M., Rodwell, M., Pinault, F., Dramsch, J. S., Lang, S. T. K., Raoult, B., Rabier, F., Chevallier, M., Sandu, I., Dueben, P., Chantry, M., and Pappenberger, F.: The rise of data-driven weather forecasting: A first statistical assessment of machine learning-based weather forecasts in an operational-like context, B. Am. Meteorol. Soc., 105, E864–E883, <ext-link xlink:href="https://doi.org/10.1175/BAMS-D-23-0162.1" ext-link-type="DOI">10.1175/BAMS-D-23-0162.1</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx3"><label>Bi et al.(2023)Bi, Xie, Zhang et al.</label><mixed-citation>Bi, K., Xie, L., Zhang, H., et al.: Accurate medium-range global weather forecasting with 3D neural networks, Nature, 619, 533–538, <ext-link xlink:href="https://doi.org/10.1038/s41586-023-06185-3" ext-link-type="DOI">10.1038/s41586-023-06185-3</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx4"><label>Bonavita(2024)</label><mixed-citation>Bonavita, M.: On Some Limitations of Current Machine Learning Weather Prediction Models, Geophys. Res. Lett., 51, e2023GL107377, <ext-link xlink:href="https://doi.org/10.1029/2023GL107377" ext-link-type="DOI">10.1029/2023GL107377</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx5"><label>Bonev et al.(2025)Bonev, Kurth, Mahesh, Bisson, Kossaifi, Kashinath, Anandkumar, Collins, Pritchard, and Keller</label><mixed-citation>Bonev, B., Kurth, T., Mahesh, A., Bisson, M., Kossaifi, J., Kashinath, K., Anandkumar, A., Collins, W. D., Pritchard, M. S., and Keller, A.: FourCastNet 3: A geometric approach to probabilistic machine-learning weather forecasting at scale, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2507.12144" ext-link-type="DOI">10.48550/arXiv.2507.12144</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx6"><label>Brenowitz et al.(2025)Brenowitz, Cohen, Pathak, Mahesh, Bonev, Kurth, Durran, Harrington, and Pritchard</label><mixed-citation>Brenowitz, N. D., Cohen, Y., Pathak, J., Mahesh, A., Bonev, B., Kurth, T., Durran, D. R., Harrington, P., and Pritchard, M. S.: A Practical Probabilistic Benchmark for AI Weather Models, Geophys. Res. Lett., 52, <ext-link xlink:href="https://doi.org/10.1029/2024gl113656" ext-link-type="DOI">10.1029/2024gl113656</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx7"><label>Chen et al.(2023)Chen, Zhong, Zhang, Cheng, Xu, Qi, and Li</label><mixed-citation>Chen, L., Zhong, X., Zhang, F., Cheng, Y., Xu, Y., Qi, Y., and Li, H.: FuXi: a cascade machine learning forecasting system for 15-day global weather forecast, npj Clim. Atmos. Sci., 6, <ext-link xlink:href="https://doi.org/10.1038/s41612-023-00512-1" ext-link-type="DOI">10.1038/s41612-023-00512-1</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx8"><label>ECMWF(2025a)</label><mixed-citation>ECMWF: aifs-single-1.1 (Revision 7976552), ECMWF [code], <ext-link xlink:href="https://doi.org/10.57967/hf/6415" ext-link-type="DOI">10.57967/hf/6415</ext-link>, 2025a.</mixed-citation></ref>
      <ref id="bib1.bibx9"><label>ECMWF(2025b)</label><mixed-citation>ECMWF: Open data, ECMWF [data set], <ext-link xlink:href="https://doi.org/10.21957/OPEN-DATA" ext-link-type="DOI">10.21957/OPEN-DATA</ext-link>, 2025b.</mixed-citation></ref>
      <ref id="bib1.bibx10"><label>European Centre for Medium-Range Weather Forecasts(2025)</label><mixed-citation>European Centre for Medium-Range Weather Forecasts: AIFS 1.1.0: Permanent Archive of Checkpoints and Source Code for Training and Inference, Zenodo [code], <ext-link xlink:href="https://doi.org/10.5281/ZENODO.17349820" ext-link-type="DOI">10.5281/ZENODO.17349820</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx11"><label>Hakim and Masanam(2024)</label><mixed-citation>Hakim, G. J. and Masanam, S.: Dynamical tests of a deep-learning weather prediction model, Artif. Intel. Earth Syst., 3, <ext-link xlink:href="https://doi.org/10.1175/aies-d-23-0090" ext-link-type="DOI">10.1175/aies-d-23-0090</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx12"><label>Harder et al.(2024)Harder, Hernandez-Garcia, Ramesh, Yang, Sattigeri, Szwarcman, Watson, and Rolnick</label><mixed-citation>Harder, P., Hernandez-Garcia, A., Ramesh, V., Yang, Q., Sattigeri, P., Szwarcman, D., Watson, C., and Rolnick, D.: Hard-Constrained Deep Learning for Climate Downscaling, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2208.05424" ext-link-type="DOI">10.48550/arXiv.2208.05424</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx13"><label>Hersbach et al.(2020)Hersbach, Bell, Berrisford et al.</label><mixed-citation>Hersbach, H., Bell, B., Berrisford, P., et al.: The ERA5 global reanalysis, Q. J. Roy. Meteorol. Soc., 146, 1999–2049, <ext-link xlink:href="https://doi.org/10.1002/qj.3803" ext-link-type="DOI">10.1002/qj.3803</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx14"><label>Hersbach et al.(2023)</label><mixed-citation>Hersbach, H., Bell, B., Berrisford, P., Biavati, G., Horányi, A., Muñoz Sabater, J., Nicolas, J., Peubey, C., Radu, R., Rozum, I., Schepers, D., Simmons, A., Soci, C., Dee, D., and Thépaut, J.-N.: ERA5 hourly data on single levels from 1940 to present, Copernicus Climate Change Service (C3S) Climate Data Store (CDS) [data set], <ext-link xlink:href="https://doi.org/10.24381/cds.adbb2d47" ext-link-type="DOI">10.24381/cds.adbb2d47</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx15"><label>Huffman et al.(2023)Huffman, Stocker, Bolvin, Nelkin, and Tan</label><mixed-citation>Huffman, G. J., Stocker, E. F., Bolvin, D. T., Nelkin, E. J., and Tan, J.: GPM IMERG Final Precipitation L3 1 day 0.1 degree <inline-formula><mml:math id="M155" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 0.1 degree V07, GES DISC [data set], <ext-link xlink:href="https://doi.org/10.5067/GPM/IMERGDF/DAY/07" ext-link-type="DOI">10.5067/GPM/IMERGDF/DAY/07</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx16"><label>Jolliffe and Stephenson(2011)</label><mixed-citation>Jolliffe, I. T. and Stephenson, D. B. (Eds.): Forecast verification, in: 2nd Edn., Wiley-Blackwell, Hoboken, NJ, <ext-link xlink:href="https://doi.org/10.1002/9781119960003" ext-link-type="DOI">10.1002/9781119960003</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bibx17"><label>Keisler(2022)</label><mixed-citation>Keisler, R.: Forecasting global weather with graph neural networks, arXiv [preprint], arXiv:2202.07575, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2202.07575" ext-link-type="DOI">10.48550/arXiv.2202.07575</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx18"><label>Kent et al.(2025)Kent, Scaife, Dunstone, Smith, Hardiman, Dunstan, and Watt-Meyer</label><mixed-citation>Kent, C., Scaife, A. A., Dunstone, N. J., Smith, D., Hardiman, S. C., Dunstan, T., and Watt-Meyer, O.: Skilful global seasonal predictions from a machine learning weather model trained on reanalysis data, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2503.23953" ext-link-type="DOI">10.48550/arXiv.2503.23953</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx19"><label>Lam et al.(2023)Lam, Sanchez-Gonzalez, Willson, Wirnsberger, Fortunato, Alet, Ravuri, Ewalds, Eaton-Rosen, Hu, Merose, Hoyer, Holland, Vinyals, Stott, Pritzel, Mohamed, and Battaglia</label><mixed-citation>Lam, R., Sanchez-Gonzalez, A., Willson, M., Wirnsberger, P., Fortunato, M., Alet, F., Ravuri, S., Ewalds, T., Eaton-Rosen, Z., Hu, W., Merose, A., Hoyer, S., Holland, G., Vinyals, O., Stott, J., Pritzel, A., Mohamed, S., and Battaglia, P.: Learning skillful medium-range global weather forecasting, Science, 382, 1416–1421, <ext-link xlink:href="https://doi.org/10.1126/science.adi2336" ext-link-type="DOI">10.1126/science.adi2336</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx20"><label>Lang et al.(2024a)Lang, Alexe, Chantry, Dramsch, Pinault, Raoult, Clare, Lessig, Maier-Gerber, Magnusson, Bouallègue, Nemesio, Dueben, Brown, Pappenberger, and Rabier</label><mixed-citation>Lang, S., Alexe, M., Chantry, M., Dramsch, J., Pinault, F., Raoult, B., Clare, M. C. A., Lessig, C., Maier-Gerber, M., Magnusson, L., Bouallègue, Z. B., Nemesio, A. P., Dueben, P. D., Brown, A., Pappenberger, F., and Rabier, F.: AIFS – ECMWF's data-driven forecasting system, arXiv [preprint], arXiv:2406.01465, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2406.01465" ext-link-type="DOI">10.48550/arXiv.2406.01465</ext-link>, 2024a.</mixed-citation></ref>
      <ref id="bib1.bibx21"><label>Lang et al.(2024b)Lang, Alexe, Clare, Roberts, Adewoyin, Bouallègue, Chantry, Dramsch, Dueben, Hahner, Maciel, Prieto-Nemesio, O'Brien, Pinault, Polster, Raoult, Tietsche, and Leutbecher</label><mixed-citation>Lang, S., Alexe, M., Clare, M. C. A., Roberts, C., Adewoyin, R., Bouallègue, Z. B., Chantry, M., Dramsch, J., Dueben, P. D., Hahner, S., Maciel, P., Prieto-Nemesio, A., O'Brien, C., Pinault, F., Polster, J., Raoult, B., Tietsche, S., and Leutbecher, M.: AIFS-CRPS: Ensemble forecasting using a model trained with a loss function based on the Continuous Ranked Probability Score, arXiv [preprint], arXiv:2412.15832, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2412.15832" ext-link-type="DOI">10.48550/arXiv.2412.15832</ext-link>, 2024b.</mixed-citation></ref>
      <ref id="bib1.bibx22"><label>Loshchilov and Hutter(2019)</label><mixed-citation>Loshchilov, I. and Hutter, F.: Decoupled Weight Decay Regularization, in: International Conference on Learning Representations, <uri>https://openreview.net/forum?id=Bkg6RiCqY7</uri> (last access: 31 March 2026), 2019.</mixed-citation></ref>
      <ref id="bib1.bibx23"><label>Micikevicius et al.(2018)Micikevicius, Narang, Alben, Diamos, Elsen, Garcia, Ginsburg, Houston, Kuchaiev, Venkatesh, and Wu</label><mixed-citation>Micikevicius, P., Narang, S., Alben, J., Diamos, G., Elsen, E., Garcia, D., Ginsburg, B., Houston, M., Kuchaiev, O., Venkatesh, G., and Wu, H.: Mixed Precision Training, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.1710.03740" ext-link-type="DOI">10.48550/arXiv.1710.03740</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx24"><label>Muñoz Sabater et al.(2021)Muñoz Sabater, Dutra, Agustí-Panareda, Albergel, Arduini, Balsamo, Boussetta, Choulga, Harrigan, Hersbach, Martens, Miralles, Piles, Rodríguez-Fernández, Zsoter, Buontempo, and Thépaut</label><mixed-citation>Muñoz Sabater, J., Dutra, E., Agustí-Panareda, A., Albergel, C., Arduini, G., Balsamo, G., Boussetta, S., Choulga, M., Harrigan, S., Hersbach, H., Martens, B., Miralles, D. G., Piles, M., Rodríguez-Fernández, N. J., Zsoter, E., Buontempo, C., and Thépaut, J.-N.: ERA5-Land: a state-of-the-art global reanalysis dataset for land applications, Earth Syst. Sci. Data, 13, 4349–4383, <ext-link xlink:href="https://doi.org/10.5194/essd-13-4349-2021" ext-link-type="DOI">10.5194/essd-13-4349-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx25"><label>NASA Earth Observatory(2025)</label><mixed-citation>NASA Earth Observatory: Rainy, Stormy Days in Queensland, NASA Earth Observatory, Visible Earth, <uri>https://earthobservatory.nasa.gov/images/153914/rainy-stormy-days-in-queensland</uri> (last access: 31 March 2026), 2025.</mixed-citation></ref>
      <ref id="bib1.bibx26"><label>Nipen et al.(2024)Nipen, Haugen, Ingstad, Nordhagen, Salihi, Tedesco, Seierstad, Kristiansen, Lang, Alexe, Dramsch, Raoult, Mertes, and Chantry</label><mixed-citation>Nipen, T. N., Haugen, H. H., Ingstad, M. S., Nordhagen, E. M., Salihi, A. F. S., Tedesco, P., Seierstad, I. A., Kristiansen, J., Lang, S., Alexe, M., Dramsch, J., Raoult, B., Mertes, G., and Chantry, M.: Regional data-driven weather modeling with a global stretched-grid, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2409.02891" ext-link-type="DOI">10.48550/arXiv.2409.02891</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx27"><label>Pathak et al.(2022)Pathak, Subramanian, Harrington, Raja, Chattopadhyay, Mardani, Kurth, Hall, Li, Azizzadenesheli, and Hassanzadeh</label><mixed-citation>Pathak, J., Subramanian, S., Harrington, P., Raja, S., Chattopadhyay, A., Mardani, M., Kurth, T., Hall, D., Li, Z., Azizzadenesheli, K., and Hassanzadeh, P.: FourCastNet: A global data-driven high-resolution weather model using adaptive fourier neural operators, arXiv [preprint], arXiv:2202.11214, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2202.11214" ext-link-type="DOI">10.48550/arXiv.2202.11214</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx28"><label>Pfeifroth et al.(2023)Pfeifroth, Kothe, Drücke, Trentmann, Schröder, Selbach, and Hollmann</label><mixed-citation>Pfeifroth, U., Kothe, S., Drücke, J., Trentmann, J., Schröder, M., Selbach, N., and Hollmann, R.: Surface Radiation Data Set – Heliosat (SARAH) – Edition 3, EUMETSAT, <ext-link xlink:href="https://doi.org/10.5676/EUM_SAF_CM/SARAH/V003" ext-link-type="DOI">10.5676/EUM_SAF_CM/SARAH/V003</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx29"><label>Rasp et al.(2024)Rasp, Hoyer, Merose, Langmore, Battaglia, Russell, Sanchez-Gonzalez, Yang, Carver, Agrawal, Chantry, Ben Bouallegue, Dueben, Bromberg, Sisk, Barrington, Bell, and Sha</label><mixed-citation>Rasp, S., Hoyer, S., Merose, A., Langmore, I., Battaglia, P., Russell, T., Sanchez-Gonzalez, A., Yang, V., Carver, R., Agrawal, S., Chantry, M., Ben Bouallegue, Z., Dueben, P., Bromberg, C., Sisk, J., Barrington, L., Bell, A., and Sha, F.: WeatherBench 2: A Benchmark for the Next Generation of Data-Driven Global Weather Models, J. Adv. Model. Earth Syst., 16, e2023MS004019, <ext-link xlink:href="https://doi.org/10.1029/2023MS004019" ext-link-type="DOI">10.1029/2023MS004019</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx30"><label>Rodwell et al.(2010)Rodwell, Richardson, Hewson, and Haiden</label><mixed-citation>Rodwell, M. J., Richardson, D. S., Hewson, T. D., and Haiden, T.: A new equitable score suitable for verifying precipitation in numerical weather prediction, Q. J. Roy. Meteorol. Soc., 136, 1344–1363, <ext-link xlink:href="https://doi.org/10.1002/qj.656" ext-link-type="DOI">10.1002/qj.656</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx31"><label>Schreck et al.(2025)Schreck, Sha, Chapman, Kimpara, Berner, McGinnis, Kazadi, Sobhani, Kirk, Becker, Gantos, and Gagne II</label><mixed-citation>Schreck, J. S., Sha, Y., Chapman, W., Kimpara, D., Berner, J., McGinnis, S., Kazadi, A., Sobhani, N., Kirk, B., Becker, C., Gantos, G., and Gagne II, D. J.: Community Research Earth Digital Intelligence Twin: a scalable framework for AI-driven Earth System Modeling, npj Clim. Atmos. Sci., 8, <ext-link xlink:href="https://doi.org/10.1038/s41612-025-01125-6" ext-link-type="DOI">10.1038/s41612-025-01125-6</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx32"><label>Sha et al.(2025a)Sha, Schreck, Chapman, and Gagne II</label><mixed-citation>Sha, Y., Schreck, J. S., Chapman, W., and Gagne II, D. J.: Investigating the Use of Terrain-Following Coordinates in AI-Driven Precipitation Forecasts, Geophys. Res. Lett., 52, e2025GL118478, <ext-link xlink:href="https://doi.org/10.1029/2025GL118478" ext-link-type="DOI">10.1029/2025GL118478</ext-link>, 2025a.</mixed-citation></ref>
      <ref id="bib1.bibx33"><label>Sha et al.(2025b)Sha, Schreck, Chapman, and Gagne II</label><mixed-citation>Sha, Y., Schreck, J. S., Chapman, W., and Gagne II, D. J.: Improving AI Weather Prediction Models Using Global Mass and Energy Conservation Schemes, J. Adv. Model. Earth Syst., 17, e2025MS005138, <ext-link xlink:href="https://doi.org/10.1029/2025MS005138" ext-link-type="DOI">10.1029/2025MS005138</ext-link>, 2025b.</mixed-citation></ref>
      <ref id="bib1.bibx34"><label>Subramaniam et al.(2025)Subramaniam, Durran, Pruitt, Cresswell-Clay, and Yik</label><mixed-citation>Subramaniam, A., Durran, D., Pruitt, D., Cresswell-Clay, N., and Yik, W.: Imposing the Fundamental Dynamical Constraint of Hydrostatic Balance to Improve Global ML Weather Prediction, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2506.08285" ext-link-type="DOI">10.48550/arXiv.2506.08285</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx35"><label>Thiem and Collins(2025)</label><mixed-citation>Thiem, H. and Collins, N.: Historic January 2025 Snowstorm in the Southern US, <uri>https://www.climate.gov/news-features/event-tracker/historic-january-2025-snowstorm-southern-us</uri> (last access: 31 March 2026), 2025.</mixed-citation></ref>
      <ref id="bib1.bibx36"><label>Wedi(2014)</label><mixed-citation>Wedi, N. P.: Increasing the horizontal resolution in numerical weather prediction and climate simulations: illusion or panacea?, Philos. T. Roy. Soc. A, 372, <ext-link xlink:href="https://doi.org/10.1098/rsta.2013.0289" ext-link-type="DOI">10.1098/rsta.2013.0289</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bibx37"><label>Wijnands et al.(2025)Wijnands, Ginderachter, François, Buurman, Termonia, and den Bleeken</label><mixed-citation>Wijnands, J. S., Ginderachter, M. V., François, B., Buurman, S., Termonia, P., and den Bleeken, D. V.: A comparison of stretched-grid and limited-area modelling for data-driven regional weather forecasting, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.2507.18378" ext-link-type="DOI">10.48550/arXiv.2507.18378</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx38"><label>Wilks(2019)</label><mixed-citation>Wilks, D. S.: Statistical methods in the atmospheric sciences, in: 4th Edn., Elsevier Science Publishing, Philadelphia, PA, <ext-link xlink:href="https://doi.org/10.1016/C2017-0-03921-6" ext-link-type="DOI">10.1016/C2017-0-03921-6</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx39"><label>Zuo et al.(2024)Zuo, Alonso-Balmaseda, de Boisseson, Browne, Chrust, Keeley, Mogensen, Pelletier, de Rosnay, and Takakura</label><mixed-citation>Zuo, H., Alonso-Balmaseda, M., de Boisseson, E., Browne, P., Chrust, M., Keeley, S., Mogensen, K., Pelletier, C., de Rosnay, P., and Takakura, T.: ECMWF's next ensemble reanalysis system for ocean and sea ice: ORAS6, ECMWF Newsletter, 30–36, <ext-link xlink:href="https://doi.org/10.21957/hzd5y821lk" ext-link-type="DOI">10.21957/hzd5y821lk</ext-link>, 2024.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>AIFS Single 1.1.0: an update to ECMWF's machine-learned weather forecast model AIFS</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>Balogh et al.(2024)Balogh, Saint-Martin, and
Geoffroy</label><mixed-citation>
      
Balogh, B., Saint-Martin, D., and Geoffroy, O.: Online Test of a Neural Network Deep Convection Parameterization in ARP-GEM1, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2410.21920" target="_blank">https://doi.org/10.48550/arXiv.2410.21920</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>Ben Bouallègue et al.(2024)Ben Bouallègue, Clare, Magnusson,
Gascón, Maier-Gerber, Janoušek, Rodwell, Pinault, Dramsch, Lang, Raoult,
Rabier, Chevallier, Sandu, Dueben, Chantry, and
Pappenberger</label><mixed-citation>
      
Ben Bouallègue, Z., Clare, M. C. A., Magnusson, L., Gascón, E.,
Maier-Gerber, M., Janoušek, M., Rodwell, M., Pinault, F., Dramsch, J. S.,
Lang, S. T. K., Raoult, B., Rabier, F., Chevallier, M., Sandu, I., Dueben,
P., Chantry, M., and Pappenberger, F.: The rise of data-driven weather
forecasting: A first statistical assessment of machine learning-based weather
forecasts in an operational-like context, B. Am. Meteorol. Soc., 105, E864–E883, <a href="https://doi.org/10.1175/BAMS-D-23-0162.1" target="_blank">https://doi.org/10.1175/BAMS-D-23-0162.1</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>Bi et al.(2023)Bi, Xie, Zhang et al.</label><mixed-citation>
      
Bi, K., Xie, L., Zhang, H., et al.: Accurate medium-range global weather
forecasting with 3D neural networks, Nature, 619, 533–538,
<a href="https://doi.org/10.1038/s41586-023-06185-3" target="_blank">https://doi.org/10.1038/s41586-023-06185-3</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>Bonavita(2024)</label><mixed-citation>
      
Bonavita, M.: On Some Limitations of Current Machine Learning Weather
Prediction Models, Geophys. Res. Lett., 51, e2023GL107377, <a href="https://doi.org/10.1029/2023GL107377" target="_blank">https://doi.org/10.1029/2023GL107377</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>Bonev et al.(2025)Bonev, Kurth, Mahesh, Bisson, Kossaifi, Kashinath, Anandkumar, Collins, Pritchard, and
Keller</label><mixed-citation>
      
Bonev, B., Kurth, T., Mahesh, A., Bisson, M., Kossaifi, J., Kashinath, K.,
Anandkumar, A., Collins, W. D., Pritchard, M. S., and Keller, A.: FourCastNet 3: A geometric approach to probabilistic machine-learning weather forecasting at scale, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2507.12144" target="_blank">https://doi.org/10.48550/arXiv.2507.12144</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>Brenowitz et al.(2025)Brenowitz, Cohen, Pathak, Mahesh, Bonev, Kurth, Durran, Harrington, and Pritchard</label><mixed-citation>
      
Brenowitz, N. D., Cohen, Y., Pathak, J., Mahesh, A., Bonev, B., Kurth, T.,
Durran, D. R., Harrington, P., and Pritchard, M. S.: A Practical
Probabilistic Benchmark for AI Weather Models, Geophys. Res. Lett., 52, <a href="https://doi.org/10.1029/2024gl113656" target="_blank">https://doi.org/10.1029/2024gl113656</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>Chen et al.(2023)Chen, Zhong, Zhang, Cheng, Xu, Qi, and
Li</label><mixed-citation>
      
Chen, L., Zhong, X., Zhang, F., Cheng, Y., Xu, Y., Qi, Y., and Li, H.:
FuXi: a cascade machine learning forecasting system for 15-day global
weather forecast, npj Clim. Atmos. Sci., 6, <a href="https://doi.org/10.1038/s41612-023-00512-1" target="_blank">https://doi.org/10.1038/s41612-023-00512-1</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>ECMWF(2025a)</label><mixed-citation>
      
ECMWF: aifs-single-1.1 (Revision 7976552), ECMWF [code], <a href="https://doi.org/10.57967/hf/6415" target="_blank">https://doi.org/10.57967/hf/6415</a>, 2025a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>ECMWF(2025b)</label><mixed-citation>
      
ECMWF: Open data, ECMWF [data set], <a href="https://doi.org/10.21957/OPEN-DATA" target="_blank">https://doi.org/10.21957/OPEN-DATA</a>, 2025b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>European Centre for Medium-Range Weather
Forecasts(2025)</label><mixed-citation>
      
European Centre for Medium-Range Weather Forecasts: AIFS 1.1.0: Permanent
Archive of Checkpoints and Source Code for Training and Inference, Zenodo [code], <a href="https://doi.org/10.5281/ZENODO.17349820" target="_blank">https://doi.org/10.5281/ZENODO.17349820</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>Hakim and Masanam(2024)</label><mixed-citation>
      
Hakim, G. J. and Masanam, S.: Dynamical tests of a deep-learning weather
prediction model, Artif. Intel. Earth Syst., 3, <a href="https://doi.org/10.1175/aies-d-23-0090" target="_blank">https://doi.org/10.1175/aies-d-23-0090</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>Harder et al.(2024)Harder, Hernandez-Garcia, Ramesh, Yang, Sattigeri, Szwarcman, Watson, and Rolnick</label><mixed-citation>
      
Harder, P., Hernandez-Garcia, A., Ramesh, V., Yang, Q., Sattigeri, P.,
Szwarcman, D., Watson, C., and Rolnick, D.: Hard-Constrained Deep Learning
for Climate Downscaling, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2208.05424" target="_blank">https://doi.org/10.48550/arXiv.2208.05424</a>,
2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>Hersbach et al.(2020)Hersbach, Bell, Berrisford
et al.</label><mixed-citation>
      
Hersbach, H., Bell, B., Berrisford, P., et al.: The ERA5 global reanalysis,
Q. J. Roy. Meteorol. Soc., 146, 1999–2049, <a href="https://doi.org/10.1002/qj.3803" target="_blank">https://doi.org/10.1002/qj.3803</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>Hersbach et al.(2023)</label><mixed-citation>
      
Hersbach, H., Bell, B., Berrisford, P., Biavati, G., Horányi, A., Muñoz Sabater, J., Nicolas, J., Peubey, C., Radu, R., Rozum, I., Schepers, D., Simmons, A., Soci, C., Dee, D., and Thépaut, J.-N.:
ERA5 hourly data on single levels from 1940 to present, Copernicus Climate Change Service (C3S) Climate Data Store (CDS) [data set], <a href="https://doi.org/10.24381/cds.adbb2d47" target="_blank">https://doi.org/10.24381/cds.adbb2d47</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>Huffman et al.(2023)Huffman, Stocker, Bolvin, Nelkin, and
Tan</label><mixed-citation>
      
Huffman, G. J., Stocker, E. F., Bolvin, D. T., Nelkin, E. J., and Tan, J.: GPM IMERG Final Precipitation L3 1 day 0.1 degree × 0.1 degree V07, GES DISC [data set], <a href="https://doi.org/10.5067/GPM/IMERGDF/DAY/07" target="_blank">https://doi.org/10.5067/GPM/IMERGDF/DAY/07</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>Jolliffe and Stephenson(2011)</label><mixed-citation>
      
Jolliffe, I. T. and Stephenson, D. B. (Eds.): Forecast verification, in:
2nd Edn., Wiley-Blackwell, Hoboken, NJ, <a href="https://doi.org/10.1002/9781119960003" target="_blank">https://doi.org/10.1002/9781119960003</a>, 2011.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>Keisler(2022)</label><mixed-citation>
      
Keisler, R.: Forecasting global weather with graph neural networks, arXiv
[preprint], arXiv:2202.07575, <a href="https://doi.org/10.48550/arXiv.2202.07575" target="_blank">https://doi.org/10.48550/arXiv.2202.07575</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>Kent et al.(2025)Kent, Scaife, Dunstone, Smith, Hardiman, Dunstan,
and Watt-Meyer</label><mixed-citation>
      
Kent, C., Scaife, A. A., Dunstone, N. J., Smith, D., Hardiman, S. C., Dunstan, T., and Watt-Meyer, O.: Skilful global seasonal predictions from a machine learning weather model trained on reanalysis data, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.2503.23953" target="_blank">https://doi.org/10.48550/arXiv.2503.23953</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>Lam et al.(2023)Lam, Sanchez-Gonzalez, Willson, Wirnsberger,
Fortunato, Alet, Ravuri, Ewalds, Eaton-Rosen, Hu, Merose, Hoyer, Holland,
Vinyals, Stott, Pritzel, Mohamed, and Battaglia</label><mixed-citation>
      
Lam, R., Sanchez-Gonzalez, A., Willson, M., Wirnsberger, P., Fortunato, M.,
Alet, F., Ravuri, S., Ewalds, T., Eaton-Rosen, Z., Hu, W., Merose, A., Hoyer,
S., Holland, G., Vinyals, O., Stott, J., Pritzel, A., Mohamed, S., and
Battaglia, P.: Learning skillful medium-range global weather forecasting,
Science, 382, 1416–1421, <a href="https://doi.org/10.1126/science.adi2336" target="_blank">https://doi.org/10.1126/science.adi2336</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>Lang et al.(2024a)Lang, Alexe, Chantry, Dramsch,
Pinault, Raoult, Clare, Lessig, Maier-Gerber, Magnusson, Bouallègue,
Nemesio, Dueben, Brown, Pappenberger, and Rabier</label><mixed-citation>
      
Lang, S., Alexe, M., Chantry, M., Dramsch, J., Pinault, F., Raoult, B., Clare, M. C. A., Lessig, C., Maier-Gerber, M., Magnusson, L., Bouallègue, Z. B., Nemesio, A. P., Dueben, P. D., Brown, A., Pappenberger, F., and Rabier, F.: AIFS – ECMWF's data-driven forecasting system, arXiv [preprint], arXiv:2406.01465, <a href="https://doi.org/10.48550/arXiv.2406.01465" target="_blank">https://doi.org/10.48550/arXiv.2406.01465</a>, 2024a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>Lang et al.(2024b)Lang, Alexe, Clare, Roberts, Adewoyin,
Bouallègue, Chantry, Dramsch, Dueben, Hahner, Maciel, Prieto-Nemesio,
O'Brien, Pinault, Polster, Raoult, Tietsche, and
Leutbecher</label><mixed-citation>
      
Lang, S., Alexe, M., Clare, M. C. A., Roberts, C., Adewoyin, R., Bouallègue, Z. B., Chantry, M., Dramsch, J., Dueben, P. D., Hahner, S., Maciel, P., Prieto-Nemesio, A., O'Brien, C., Pinault, F., Polster, J., Raoult, B., Tietsche, S., and Leutbecher, M.: AIFS-CRPS: Ensemble forecasting using a model trained with a loss function based on the Continuous Ranked Probability Score, arXiv [preprint], arXiv:2412.15832,
<a href="https://doi.org/10.48550/arXiv.2412.15832" target="_blank">https://doi.org/10.48550/arXiv.2412.15832</a>, 2024b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>Loshchilov and Hutter(2019)</label><mixed-citation>
      
Loshchilov, I. and Hutter, F.: Decoupled Weight Decay Regularization, in:
International Conference on Learning Representations,
<a href="https://openreview.net/forum?id=Bkg6RiCqY7" target="_blank">https://openreview.net/forum?id=Bkg6RiCqY7</a> (last access: 31 March 2026), 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>Micikevicius et al.(2018)Micikevicius, Narang, Alben, Diamos, Elsen, Garcia, Ginsburg, Houston, Kuchaiev, Venkatesh, and
Wu</label><mixed-citation>
      
Micikevicius, P., Narang, S., Alben, J., Diamos, G., Elsen, E., Garcia, D.,
Ginsburg, B., Houston, M., Kuchaiev, O., Venkatesh, G., and Wu, H.: Mixed
Precision Training, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.1710.03740" target="_blank">https://doi.org/10.48550/arXiv.1710.03740</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>Muñoz Sabater et al.(2021)Muñoz Sabater, Dutra,
Agustí-Panareda, Albergel, Arduini, Balsamo, Boussetta, Choulga,
Harrigan, Hersbach, Martens, Miralles, Piles, Rodríguez-Fernández,
Zsoter, Buontempo, and Thépaut</label><mixed-citation>
      
Muñoz Sabater, J., Dutra, E., Agustí-Panareda, A., Albergel, C.,
Arduini, G., Balsamo, G., Boussetta, S., Choulga, M., Harrigan, S., Hersbach,
H., Martens, B., Miralles, D. G., Piles, M., Rodríguez-Fernández, N. J., Zsoter, E., Buontempo, C., and Thépaut, J.-N.: ERA5-Land: a
state-of-the-art global reanalysis dataset for land applications, Earth
Syst. Sci. Data, 13, 4349–4383, <a href="https://doi.org/10.5194/essd-13-4349-2021" target="_blank">https://doi.org/10.5194/essd-13-4349-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>NASA Earth Observatory(2025)</label><mixed-citation>
      
NASA Earth Observatory: Rainy, Stormy Days in Queensland, NASA Earth Observatory, Visible Earth,
<a href="https://earthobservatory.nasa.gov/images/153914/rainy-stormy-days-in-queensland" target="_blank">https://earthobservatory.nasa.gov/images/153914/rainy-stormy-days-in-queensland</a> (last access: 31 March 2026), 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>Nipen et al.(2024)Nipen, Haugen, Ingstad, Nordhagen, Salihi, Tedesco, Seierstad, Kristiansen, Lang, Alexe, Dramsch, Raoult, Mertes, and Chantry</label><mixed-citation>
      
Nipen, T. N., Haugen, H. H., Ingstad, M. S., Nordhagen, E. M., Salihi, A.
F. S., Tedesco, P., Seierstad, I. A., Kristiansen, J., Lang, S., Alexe, M.,
Dramsch, J., Raoult, B., Mertes, G., and Chantry, M.: Regional data-driven
weather modeling with a global stretched-grid, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.2409.02891" target="_blank">https://doi.org/10.48550/arXiv.2409.02891</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>Pathak et al.(2022)Pathak, Subramanian, Harrington, Raja,
Chattopadhyay, Mardani, Kurth, Hall, Li, Azizzadenesheli, and
Hassanzadeh</label><mixed-citation>
      
Pathak, J., Subramanian, S., Harrington, P., Raja, S., Chattopadhyay, A.,
Mardani, M., Kurth, T., Hall, D., Li, Z., Azizzadenesheli, K., and
Hassanzadeh, P.: FourCastNet: A global data-driven high-resolution
weather model using adaptive fourier neural operators, arXiv [preprint],
arXiv:2202.11214, <a href="https://doi.org/10.48550/arXiv.2202.11214" target="_blank">https://doi.org/10.48550/arXiv.2202.11214</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>Pfeifroth et al.(2023)Pfeifroth, Kothe, Drücke, Trentmann,
Schröder, Selbach, and
Hollmann</label><mixed-citation>
      
Pfeifroth, U., Kothe, S., Drücke, J., Trentmann, J., Schröder, M., Selbach,
N., and Hollmann, R.: Surface Radiation Data Set – Heliosat (SARAH) – Edition 3, EUMETSAT, <a href="https://doi.org/10.5676/EUM_SAF_CM/SARAH/V003" target="_blank">https://doi.org/10.5676/EUM_SAF_CM/SARAH/V003</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>Rasp et al.(2024)Rasp, Hoyer, Merose, Langmore, Battaglia, Russell,
Sanchez-Gonzalez, Yang, Carver, Agrawal, Chantry, Ben Bouallegue, Dueben,
Bromberg, Sisk, Barrington, Bell, and Sha</label><mixed-citation>
      
Rasp, S., Hoyer, S., Merose, A., Langmore, I., Battaglia, P., Russell, T.,
Sanchez-Gonzalez, A., Yang, V., Carver, R., Agrawal, S., Chantry, M.,
Ben Bouallegue, Z., Dueben, P., Bromberg, C., Sisk, J., Barrington, L., Bell,
A., and Sha, F.: WeatherBench 2: A Benchmark for the Next Generation of
Data-Driven Global Weather Models, J. Adv. Model. Earth Syst., 16, e2023MS004019, <a href="https://doi.org/10.1029/2023MS004019" target="_blank">https://doi.org/10.1029/2023MS004019</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>Rodwell et al.(2010)Rodwell, Richardson, Hewson, and
Haiden</label><mixed-citation>
      
Rodwell, M. J., Richardson, D. S., Hewson, T. D., and Haiden, T.: A new
equitable score suitable for verifying precipitation in numerical weather
prediction, Q. J. Roy. Meteorol. Soc., 136, 1344–1363, <a href="https://doi.org/10.1002/qj.656" target="_blank">https://doi.org/10.1002/qj.656</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>Schreck et al.(2025)Schreck, Sha, Chapman, Kimpara, Berner, McGinnis, Kazadi, Sobhani, Kirk, Becker, Gantos, and Gagne II</label><mixed-citation>
      
Schreck, J. S., Sha, Y., Chapman, W., Kimpara, D., Berner, J., McGinnis, S.,
Kazadi, A., Sobhani, N., Kirk, B., Becker, C., Gantos, G., and Gagne II,
D. J.: Community Research Earth Digital Intelligence Twin: a scalable
framework for AI-driven Earth System Modeling, npj Clim. Atmos. Sci., 8, <a href="https://doi.org/10.1038/s41612-025-01125-6" target="_blank">https://doi.org/10.1038/s41612-025-01125-6</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>Sha et al.(2025a)Sha, Schreck, Chapman, and
Gagne II</label><mixed-citation>
      
Sha, Y., Schreck, J. S., Chapman, W., and Gagne II, D. J.: Investigating the
Use of Terrain-Following Coordinates in AI-Driven Precipitation Forecasts,
Geophys. Res. Lett., 52, e2025GL118478, <a href="https://doi.org/10.1029/2025GL118478" target="_blank">https://doi.org/10.1029/2025GL118478</a>, 2025a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>Sha et al.(2025b)Sha, Schreck, Chapman, and
Gagne II</label><mixed-citation>
      
Sha, Y., Schreck, J. S., Chapman, W., and Gagne II, D. J.: Improving AI Weather Prediction Models Using Global Mass and Energy Conservation Schemes, J. Adv. Model. Earth Syst., 17, e2025MS005138, <a href="https://doi.org/10.1029/2025MS005138" target="_blank">https://doi.org/10.1029/2025MS005138</a>, 2025b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>Subramaniam et al.(2025)Subramaniam, Durran, Pruitt, Cresswell-Clay, and Yik</label><mixed-citation>
      
Subramaniam, A., Durran, D., Pruitt, D., Cresswell-Clay, N., and Yik, W.:
Imposing the Fundamental Dynamical Constraint of Hydrostatic Balance to
Improve Global ML Weather Prediction, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.2506.08285" target="_blank">https://doi.org/10.48550/arXiv.2506.08285</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>Thiem and Collins(2025)</label><mixed-citation>
      
Thiem, H. and Collins, N.: Historic January 2025 Snowstorm in the Southern
US,
<a href="https://www.climate.gov/news-features/event-tracker/historic-january-2025-snowstorm-southern-us" target="_blank">https://www.climate.gov/news-features/event-tracker/historic-january-2025-snowstorm-southern-us</a> (last access: 31 March 2026), 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>Wedi(2014)</label><mixed-citation>
      
Wedi, N. P.: Increasing the horizontal resolution in numerical weather
prediction and climate simulations: illusion or panacea?, Philos. T. Roy. Soc. A, 372, <a href="https://doi.org/10.1098/rsta.2013.0289" target="_blank">https://doi.org/10.1098/rsta.2013.0289</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>Wijnands et al.(2025)Wijnands, Ginderachter, François, Buurman,
Termonia, and den Bleeken</label><mixed-citation>
      
Wijnands, J. S., Ginderachter, M. V., François, B., Buurman, S., Termonia, P., and den Bleeken, D. V.: A comparison of stretched-grid and limited-area
modelling for data-driven regional weather forecasting, arXiv [preprint],
<a href="https://doi.org/10.48550/arXiv.2507.18378" target="_blank">https://doi.org/10.48550/arXiv.2507.18378</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>Wilks(2019)</label><mixed-citation>
      
Wilks, D. S.: Statistical methods in the atmospheric sciences, in: 4th Edn., Elsevier Science Publishing, Philadelphia, PA, <a href="https://doi.org/10.1016/C2017-0-03921-6" target="_blank">https://doi.org/10.1016/C2017-0-03921-6</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>Zuo et al.(2024)Zuo, Alonso-Balmaseda, de Boisseson, Browne, Chrust, Keeley, Mogensen, Pelletier, de Rosnay, and Takakura</label><mixed-citation>
      
Zuo, H., Alonso-Balmaseda, M., de Boisseson, E., Browne, P., Chrust, M.,
Keeley, S., Mogensen, K., Pelletier, C., de Rosnay, P., and Takakura, T.:
ECMWF's next ensemble reanalysis system for ocean and sea ice: ORAS6, ECMWF
Newsletter, 30–36, <a href="https://doi.org/10.21957/hzd5y821lk" target="_blank">https://doi.org/10.21957/hzd5y821lk</a>, 2024.

    </mixed-citation></ref-html>--></article>
