<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="research-article">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">GMD</journal-id><journal-title-group>
    <journal-title>Geoscientific Model Development</journal-title>
    <abbrev-journal-title abbrev-type="publisher">GMD</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Geosci. Model Dev.</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1991-9603</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/gmd-19-2479-2026</article-id><title-group><article-title><inline-formula><mml:math id="M1" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation within JEDI for NOAA's regional Air Quality Model (AQMv7): application to the September 2020 Western US wildfires</article-title><alt-title><inline-formula><mml:math id="M2" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation within JEDI for NOAA's regional Air Quality Model</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes" rid="aff1 aff2">
          <name><surname>Wang</surname><given-names>Hongli</given-names></name>
          <email>hongli.wang@noaa.gov</email>
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Martin</surname><given-names>Cory</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5">
          <name><surname>Barré</surname><given-names>Jérôme</given-names></name>
          
        <ext-link>https://orcid.org/0009-0007-5691-5540</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff2">
          <name><surname>Li</surname><given-names>Ruifang</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Weygandt</surname><given-names>Steve</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Huang</surname><given-names>Jianping</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff6 aff7">
          <name><surname>Tang</surname><given-names>Youhua</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-7089-7915</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff8 aff3">
          <name><surname>Choi</surname><given-names>Hyundeok</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff8 aff3">
          <name><surname>Tangborn</surname><given-names>Andrew</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff9 aff3">
          <name><surname>Wang</surname><given-names>Kai</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff9 aff3">
          <name><surname>Liu</surname><given-names>Haixia</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff10">
          <name><surname>Lee</surname><given-names>Jeffrey</given-names></name>
          
        <ext-link>https://orcid.org/0009-0007-6124-9685</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>Cooperative Institute for Research in Environmental Sciences, University of Colorado, Boulder, CO 80305, USA</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>NOAA Global Systems Laboratory, Boulder, CO 80305, USA</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>NOAA/NWS/NCEP/EMC, College Park, MD 20740, USA</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>NASA Global Modeling and Assimilation Office, Greenbelt, MD 20771, USA</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>Morgan State University, Baltimore, MD 21251, USA</institution>
        </aff>
        <aff id="aff6"><label>6</label><institution>Center for Spatial Information Science and Systems, George Mason University, Fairfax, VA 22030, USA</institution>
        </aff>
        <aff id="aff7"><label>7</label><institution>NOAA Air Resources Laboratory (ARL), College Park, MD 20740, USA</institution>
        </aff>
        <aff id="aff8"><label>8</label><institution>SAIC@NOAA/NWS/NCEP/EMC, College Park, MD 20740, USA</institution>
        </aff>
        <aff id="aff9"><label>9</label><institution>LINKER@NOAA/NWS/NCEP/EMC, College Park, MD 20740, USA</institution>
        </aff>
        <aff id="aff10"><label>10</label><institution>School of Meteorology, University of Oklahoma, Norman, OK 73072, USA</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Hongli Wang (hongli.wang@noaa.gov)</corresp></author-notes><pub-date><day>27</day><month>March</month><year>2026</year></pub-date>
      
      <volume>19</volume>
      <issue>6</issue>
      <fpage>2479</fpage><lpage>2495</lpage>
      <history>
        <date date-type="received"><day>21</day><month>August</month><year>2025</year></date>
           <date date-type="rev-request"><day>29</day><month>September</month><year>2025</year></date>
           <date date-type="rev-recd"><day>22</day><month>February</month><year>2026</year></date>
           <date date-type="accepted"><day>11</day><month>March</month><year>2026</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 Hongli Wang et al.</copyright-statement>
        <copyright-year>2026</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026.html">This article is available from https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026.html</self-uri><self-uri xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026.pdf">The full text article is available as a PDF file from https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e267">This paper describes efforts to establish aerosol data assimilation capabilities for NOAA's National Air Quality Forecasting Capability (NAQFC), a regional online air quality modeling (AQM) system under NOAA's Unified Forecast System (UFS), by assimilating measurements of fine particulate matter (<inline-formula><mml:math id="M3" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, particles with aerodynamic diameters less than 2.5 <inline-formula><mml:math id="M4" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:mrow></mml:math></inline-formula>). <inline-formula><mml:math id="M5" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation is developed within the Joint Effort for Data assimilation Integration (JEDI) framework and tested using its 3D-Var data assimilation (DA) component. The <inline-formula><mml:math id="M6" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observation operator is constructed by combining newly developed <inline-formula><mml:math id="M7" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> transformation recipes in the JEDI Variable Derivation Repository (VADER) with a general spatial interpolation operator in the Unified Forward Operator (UFO).</p>

      <p id="d2e324">Cycled DA and forecast experiments were conducted from 1 to 21 September 2020, during a period of Western US wildfires, to assess the impact of assimilating <inline-formula><mml:math id="M8" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations from the AirNow and PurpleAir networks. The control and analysis variables include individual aerosol species, with background error standard deviations generated by scaling their respective background values. Prognostic variables such as aerosol particle number and total particulate surface area are updated accordingly following each analysis update. All DA experiments use a 3-hourly cycling interval, with <inline-formula><mml:math id="M9" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations assimilated every 3 <inline-formula><mml:math id="M10" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>. The control experiment uses the same configuration but without any data assimilation. Results show that assimilating either AirNow or PurpleAir <inline-formula><mml:math id="M11" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data reduces 1–24 <inline-formula><mml:math id="M12" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast errors in terms of mean absolute error (MAE) and root mean square error (RMSE) compared to the control run over the Continental United States (CONUS).
Substantial improvements are found in regions where fire events took place and in regions largely affected by transported smoke. Overall, the assimilation of PurpleAir observations in addition to AirNow data leads to a slight reduction in 3–24 <inline-formula><mml:math id="M13" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> MAE.</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>National Oceanic and Atmospheric Administration</funding-source>
<award-id>NA23OAR4050200D</award-id>
<award-id>NA22OAR4320151</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e394">Particulate matter with an aerodynamic diameter of 2.5 <inline-formula><mml:math id="M14" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:mrow></mml:math></inline-formula> or smaller (<inline-formula><mml:math id="M15" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>) is a key contributor to poor air quality in the United States, posing significant risks to public health and the environment, and contributing to substantial loss of life (Cohen et al., 2017; Colmer et al., 2020; Huang et al., 2025). Over the past few decades, poor air quality in the US has contributed to over 100 000 premature deaths annually, far exceeding fatalities from all other weather-related causes combined, which average around 500 per year (Huang et al., 2025). Given its public health significance, <inline-formula><mml:math id="M16" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> is one of the important pollutants used in calculating the Air Quality Index (AQI) – a standardized system used by the US Environmental Protection Agency (EPA) to communicate daily air pollution levels to the public. Elevated <inline-formula><mml:math id="M17" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> concentrations frequently result in “unhealthy” AQI ratings, triggering health advisories and public warnings.</p>
      <p id="d2e440"><inline-formula><mml:math id="M18" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in the United States originates from a range of both anthropogenic and natural sources. Anthropogenic sources include agricultural activities and combustion processes, such as emissions from motor vehicles, power plants, industrial facilities, and residential heating systems. Among natural sources, wildfires are a particularly significant contributor, especially in the western United States, where their frequency and intensity have escalated dramatically over the past two decades (Wen and Burke, 2021). According to the US Environmental Protection Agency (EPA), wildfires account for approximately 15 % to 30 % of total <inline-formula><mml:math id="M19" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> emissions nationwide (EPA, 2017). While national seasonal averages of <inline-formula><mml:math id="M20" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> have generally declined, summer <inline-formula><mml:math id="M21" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> concentrations in the western US have remained persistently high, primarily due to wildfire smoke (O'Dell et al., 2019). In addition to degrading air quality, wildfires have caused widespread property loss. 
Since 2005, more than 129 000 homes, businesses, and other structures have been destroyed by wildfire-related events (<uri>https://headwaterseconomics.org/natural-hazards/structures-destroyed-by-wildfire</uri>, last access: 18 February 2026), underscoring the urgent need for more effective strategies in air quality monitoring, forecasting, and wildfire management.</p>
      <p id="d2e489">The National Oceanic and Atmospheric Administration (NOAA) has developed an advanced regional Air Quality Modeling (AQM) prediction system within the Unified Forecast System (UFS) framework to enhance the accuracy of air quality forecasts across the United States, particularly during wildfire events (Huang et al., 2025). The National Air Quality Forecast Capability (NAQFC), operated by NOAA's National Weather Service (NWS), has been providing operational air quality forecast guidance for over 20 years, with continuous inclusion of new capabilities. Under NAQFC, the AQM version 7 was implemented and became operational on 14 May 2024. The system features online coupling of atmospheric and chemical models, allowing dynamic interactions between meteorology and atmospheric chemistry. This integration improves the representation of emissions and ensures real-time feedback of meteorological fields that influence chemical transformations and the transport of pollutants in the atmosphere. The UFS-AQM online system has consistently shown improved performance in simulating major wildfire events, including the significant wildfires in the northwestern coastal regions of the US in September 2020, and widespread smoke transport from Canadian wildfires in the summer of 2023. This system was officially implemented on 14 May 2024 as NOAA's operational air quality prediction system (AQMv7), replacing the previous offline-coupled Global Forecast System using the Finite Volume Cube-Sphere dynamical core (GFS-FV3) version 15 with the Community Multiscale Air Quality modeling system (CMAQv5.0.2) (Chen et al., 2021).</p>
      <p id="d2e492"><inline-formula><mml:math id="M22" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data assimilation (DA) has proven effective in reducing errors in air quality forecasts (e.g., Pagowski et al., 2010, 2014; Schwartz et al., 2012; Wu et al., 2015; Robichaud, 2017; Sun et al., 2020;  Lee et al., 2022; Chen et al., 2022; Ha, 2022; Park et al., 2022; Vogel et al., 2025, among others). Pagowski et al. (2010) demonstrated that fine aerosol forecasts benefit from AirNow <inline-formula><mml:math id="M23" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> DA, showing improved verification scores for a period of at least 24 <inline-formula><mml:math id="M24" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>. Schwartz et al.  (2012) found that assimilating AirNow <inline-formula><mml:math id="M25" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations significantly improved surface <inline-formula><mml:math id="M26" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts over the CONUS compared to forecasts without DA. Wu et al. 
(2015) reported that incorporating ground-based <inline-formula><mml:math id="M27" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations notably enhanced 24 <inline-formula><mml:math id="M28" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecasts during a severe pollution episode in Shanghai. Similarly, Chen et al. (2022) showed that assimilating multi-source <inline-formula><mml:math id="M29" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data significantly improved WRF-Chem <inline-formula><mml:math id="M30" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts with benefits lasting up to 48 <inline-formula><mml:math id="M31" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>. Lee et al. (2021) highlighted the effectiveness of assimilating ground in-situ surface <inline-formula><mml:math id="M32" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations in improving the short-term <inline-formula><mml:math id="M33" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> predictions in Northeast Asia.</p>
      <p id="d2e619">Many operational regional air quality prediction systems around the world use some form of data assimilation to initialize the forecasts. These approaches vary in complexity, ranging from simple optimal interpolation to full variational or ensemble Kalman filter methods (e.g. Robichaud et al., 2016; Wei et al., 2024; Colette et al., 2025). In NOAA's current regional air quality model (AQM) operations, aerosol and chemical initial conditions are “warm-started” using 6 <inline-formula><mml:math id="M34" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecasts from the previous model cycle. The implementation of an aerosol data assimilation system can further enhance short-term air quality forecasts by providing more accurate spatial analyses of initial aerosol distributions.</p>
      <p id="d2e630">To establish aerosol data assimilation capabilities for NOAA's regional operational AQM system, we employ the Joint Effort for Data assimilation Integration (JEDI) (Trémolet and Auligné, 2020). JEDI is a flexible, agnostic, and modern data assimilation system applicable to a wide range of forecasting systems (e.g. Liu et al., 2022; Huang et al., 2023; Sluka, 2024). JEDI offers a platform that supports efficient scientific development and facilitates the transition from research to operations. As part of a broader strategic shift, NOAA and partner agencies are transitioning their data assimilation systems to JEDI, opening the door for rapid integration of new scientific advancements, greater consistency across modeling systems, and enhanced collaboration across research communities and operational centers.</p>
      <p id="d2e633">This study aims to develop and evaluate an initial aerosol analysis capability for NOAA's regional AQM system by assimilating <inline-formula><mml:math id="M35" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations using the JEDI three-dimensional variational (3D-Var) data assimilation framework. Compared to previous <inline-formula><mml:math id="M36" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data assimilation studies, this research adopts NOAA's regional operational AQMv7 system and incorporates a new <inline-formula><mml:math id="M37" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> transform in JEDI for assimilating <inline-formula><mml:math id="M38" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations. In addition to evaluating the impact of assimilating AirNow <inline-formula><mml:math id="M39" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> measurements on air quality prediction, this study also examines the impact of assimilating low-cost PurpleAir observations.
Although PurpleAir data are valuable for <inline-formula><mml:math id="M40" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> analysis (White et al., 2026) and real-time air quality monitoring, their potential impact on numerical air quality prediction remains insufficiently explored. To the authors' best knowledge, this is the first study to demonstrate the value of PurpleAir observations for air quality prediction during the wildfires of September 2020 using the AQMv7 system.</p>
      <p id="d2e703">The paper is organized as follows: Sect. 2 describes the methodology, including NOAA's AQM system, the 3D-Var approach, and JEDI <inline-formula><mml:math id="M41" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation. The experimental setup is presented in Sect. 3, including the case description, AQM configuration, AirNow and PurpleAir <inline-formula><mml:math id="M42" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations, and background error setup. Results are described in Sect. 4. A summary and discussion are presented in the final section.</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Methodology</title>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>AQMv7 overview</title>
      <p id="d2e743">NOAA's regional operational AQMv7 system was developed through the online coupling of the Finite-Volume version 3 (FV3) dynamical core-based atmospheric model (Black et al., 2021) with the EPA's Community Multiscale Air Quality (CMAQ) model v5.2.0 within the UFS framework (Huang et al., 2025). In this UFS-AQM online system, CMAQ is treated as an atmospheric chemistry column model to simulate atmospheric chemistry reactions that govern concentrations of chemical species including gas- and aerosol-phase species. The transport terms of chemical species are handled by the FV3 dynamical core in the same way as other physics tracers (Huang et al., 2025). Aerosol module version 6 (AERO6) (Zhang et al., 2018) is utilized by CMAQ to simulate aerosol processes.</p>
</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title><inline-formula><mml:math id="M43" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation within JEDI 3D-Var</title>
      <p id="d2e765">In the JEDI framework, a series of components are provided to create a flexible, comprehensive data assimilation system (Trémolet and Auligné, 2020). The JEDI 3D-Var component is used to assimilate <inline-formula><mml:math id="M44" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> for AQMv7. The 3D-Var method is chosen for its operational feasibility, primarily due to its low computational cost and the fact that it does not require an ensemble prediction system, as is needed in (hybrid) ensemble–variational data assimilation.</p>
      <p id="d2e779">In practice, a 3D-Var data assimilation system typically uses an incremental approach to minimize a quadratic cost function which is defined in terms of the analysis increment <inline-formula><mml:math id="M45" display="inline"><mml:mrow><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:math></inline-formula> relative to the guess state <inline-formula><mml:math id="M46" display="inline"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>:

            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M47" display="block"><mml:mtable rowspacing="0.2ex" class="split" displaystyle="true" columnalign="right left"><mml:mtr><mml:mtd><mml:mrow><mml:mi>J</mml:mi><mml:mo>(</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mn mathvariant="normal">2</mml:mn></mml:mfrac></mml:mstyle><mml:mo>(</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi><mml:mo>-</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub><mml:mo>)</mml:mo><mml:msup><mml:mi mathvariant="bold">B</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup><mml:mo>(</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi><mml:mo>-</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd/><mml:mtd><mml:mrow><mml:mo>+</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mn mathvariant="normal">2</mml:mn></mml:mfrac></mml:mstyle><mml:mo>(</mml:mo><mml:mi mathvariant="bold">H</mml:mi><mml:mo>[</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi><mml:mo>]</mml:mo><mml:mo>-</mml:mo><mml:mi mathvariant="bold-italic">d</mml:mi><mml:mo>)</mml:mo><mml:msup><mml:mi mathvariant="bold">R</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup><mml:mo>(</mml:mo><mml:mi mathvariant="bold">H</mml:mi><mml:mo>[</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi><mml:mo>]</mml:mo><mml:mo>-</mml:mo><mml:mi 
mathvariant="bold-italic">d</mml:mi><mml:msup><mml:mo>)</mml:mo><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>

          where: <list list-type="bullet"><list-item>
      <p id="d2e940"><inline-formula><mml:math id="M48" display="inline"><mml:mrow><mml:mi mathvariant="italic">δ</mml:mi><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the guess state departure from background state, which is usually taken from a previous short-term forecast.</p></list-item><list-item>
      <p id="d2e970"><bold>H</bold> is the linearization of the nonlinear observation operator <inline-formula><mml:math id="M49" display="inline"><mml:mi>H</mml:mi></mml:math></inline-formula>.</p></list-item><list-item>
      <p id="d2e983"><inline-formula><mml:math id="M50" display="inline"><mml:mi mathvariant="bold">B</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M51" display="inline"><mml:mi mathvariant="bold">R</mml:mi></mml:math></inline-formula> are the background and observation error covariance matrices, respectively.</p></list-item><list-item>
      <p id="d2e1000"><inline-formula><mml:math id="M52" display="inline"><mml:mi mathvariant="bold-italic">d</mml:mi></mml:math></inline-formula> is the innovation vector, defined as:</p></list-item></list>

            <disp-formula id="Ch1.E2" content-type="numbered"><label>2</label><mml:math id="M53" display="block"><mml:mrow><mml:mi mathvariant="bold-italic">d</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mo>-</mml:mo><mml:mi>H</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:math></disp-formula>

          with <inline-formula><mml:math id="M54" display="inline"><mml:mi mathvariant="bold-italic">y</mml:mi></mml:math></inline-formula> representing the observation vector.</p>
      <p id="d2e1043">Once the increment <inline-formula><mml:math id="M55" display="inline"><mml:mrow><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:math></inline-formula> is obtained, the analysis state <inline-formula><mml:math id="M56" display="inline"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is reconstructed as:

            <disp-formula id="Ch1.E3" content-type="numbered"><label>3</label><mml:math id="M57" display="block"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mi mathvariant="italic">δ</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:math></disp-formula></p>
<sec id="Ch1.S2.SS2.SSS1">
  <label>2.2.1</label><title><inline-formula><mml:math id="M58" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observation operator</title>
      <p id="d2e1109">To assimilate <inline-formula><mml:math id="M59" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data, a <inline-formula><mml:math id="M60" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> transform that builds relationships between the model aerosol variables and the observed <inline-formula><mml:math id="M61" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> needs to be developed. In AQMv7, the modal approach taken in the CMAQ model represents aerosol particle size distributions as the superposition of three lognormal modes: Aitken (I), accumulation (J), and coarse (K). It predicts only three integral properties of the size distribution for each mode: the total particle number concentration, the total surface area concentration, and the total mass concentration of the individual chemical components.</p>
      <p id="d2e1145">The total <inline-formula><mml:math id="M62" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> concentration is calculated as a weighted sum of the individual aerosol concentration across these three modes:

              <disp-formula id="Ch1.E4" content-type="numbered"><label>4</label><mml:math id="M63" display="block"><mml:mtable rowspacing="0.2ex" class="split" displaystyle="true" columnalign="right left"><mml:mtr><mml:mtd><mml:mrow><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow><mml:mo>=</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mtext>ATOTI</mml:mtext><mml:mo>⋅</mml:mo><mml:mtext>PM25AT</mml:mtext><mml:mo>+</mml:mo><mml:mtext>ATOTJ</mml:mtext><mml:mo>⋅</mml:mo><mml:mtext>PM25AC</mml:mtext></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd/><mml:mtd><mml:mrow><mml:mo>+</mml:mo><mml:mtext>ATOTK</mml:mtext><mml:mo>⋅</mml:mo><mml:mtext>PM25CO</mml:mtext></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>

            Here, ATOTI, ATOTJ, and ATOTK represent the total aerosol mass concentrations in the Aitken, accumulation, and coarse modes, respectively.  For example, ATOTI is the combined mass of 14 prognostic aerosol variables in the Aitken mode from the AERO6 aerosol module. Similarly, ATOTJ and ATOTK are the aggregated mass concentrations of 49 and 7 aerosol variables in the accumulation and coarse modes, respectively. PM25AT, PM25AC, and PM25CO are mass scaling factors for the three modes that vary by location and time. The aerosol variables within the same mode share the same mass scaling factor.</p>
      <p id="d2e1205">The <inline-formula><mml:math id="M64" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observation operator is constructed by combining the newly developed <inline-formula><mml:math id="M65" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> transformation recipes in the JEDI Variable Derivation Repository (VADER) with an existing general spatial interpolation operator in the Unified Forward Operator (UFO). VADER is responsible for transforming model variables using user-defined “recipes” to generate new variables in model space. For <inline-formula><mml:math id="M66" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation, VADER computes <inline-formula><mml:math id="M67" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> from individual aerosol species using a model-specific transformation, specifically Eq. (4) in this application. Since <inline-formula><mml:math id="M68" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> composition varies by model, these transforms are implemented within VADER to match the specific structure of the regional air quality model AQMv7. 
Once <inline-formula><mml:math id="M69" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> is derived in model space, UFO applies a generic spatial interpolation operator to map the model-simulated values to the observation locations, enabling computation of the observed minus forecast values.</p>
      <p id="d2e1276">The inputs for the <inline-formula><mml:math id="M70" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> transformation are the mixing ratios of the 70 aerosol variables with respect to dry air, the three mass scaling factors in the three modes, and dry air density for unit conversion. The output is <inline-formula><mml:math id="M71" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in units of <inline-formula><mml:math id="M72" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. It is noted that a new routine (recipe) has been added to VADER to derive dry air density from air temperature, pressure, and the specific gas constant for dry air using the ideal gas law. This is applied in cases where the dry air density is not otherwise provided for the <inline-formula><mml:math id="M73" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> calculation.</p>
      <p id="d2e1331">The new JEDI/VADER <inline-formula><mml:math id="M74" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> recipe provides nonlinear (NL), tangent linear (TL), and adjoint (AD) transforms of <inline-formula><mml:math id="M75" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> that keep the output products in the same grid space as the input variables. Hence, the generic interpolation operator in UFO is used to connect the model-derived <inline-formula><mml:math id="M76" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> fields with observed surface <inline-formula><mml:math id="M77" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> measurements. This respects the JEDI paradigm of keeping the UFO component of JEDI independent of the model.</p>
</sec>
<sec id="Ch1.S2.SS2.SSS2">
  <label>2.2.2</label><title>Background error covariance modeling</title>
      <p id="d2e1386">In a 3D-Var system, the background error covariance (BEC) determines the spatial spreading of information from observations and, together with the observation error variance, the magnitude of the analysis increments.</p>
      <p id="d2e1389">The background error covariance matrix <inline-formula><mml:math id="M78" display="inline"><mml:mi mathvariant="bold">B</mml:mi></mml:math></inline-formula> can be decomposed into a standard deviation matrix (<inline-formula><mml:math id="M79" display="inline"><mml:mi mathvariant="bold">Σ</mml:mi></mml:math></inline-formula>) and a correlation matrix (<inline-formula><mml:math id="M80" display="inline"><mml:mi mathvariant="bold">C</mml:mi></mml:math></inline-formula>), as follows:

              <disp-formula id="Ch1.E5" content-type="numbered"><label>5</label><mml:math id="M81" display="block"><mml:mrow><mml:mi mathvariant="bold">B</mml:mi><mml:mo>=</mml:mo><mml:mi mathvariant="bold">Σ</mml:mi><mml:mi mathvariant="bold">C</mml:mi><mml:mi mathvariant="bold">Σ</mml:mi></mml:mrow></mml:math></disp-formula>

            The correlation matrix <inline-formula><mml:math id="M82" display="inline"><mml:mi mathvariant="bold">C</mml:mi></mml:math></inline-formula> is generally non-diagonal. <inline-formula><mml:math id="M83" display="inline"><mml:mi mathvariant="bold">Σ</mml:mi></mml:math></inline-formula> is a diagonal matrix, with the standard deviations of the background errors for each variable on the diagonal.</p>
      <p id="d2e1444">The error modeling of the correlation matrix and standard deviations usually applies to control variables. In the first implementation of aerosol data assimilation in JEDI for AQMv7, the control variables are defined as individual forecast aerosol variables, resulting in 70 control variables for AQMv7 with the AERO6 aerosol mechanism. The setup of background error standard deviation and correlation modeling will be described in Sect. 3: Experimental setup.</p>
</sec>
<sec id="Ch1.S2.SS2.SSS3">
  <label>2.2.3</label><title>Minimization Algorithm (DRIPCG)</title>
      <p id="d2e1455">JEDI provides several minimization algorithm options. In this paper, we use the Derber–Rosati Inexact Preconditioned Conjugate Gradient (DRIPCG) algorithm (Derber and Rosati, 1989), as implemented in JEDI's OOPS (Object-Oriented Prediction System) framework. DRIPCG has been extensively tested and is chosen here for stability and convergence efficiency.</p>
</sec>
</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Experimental setup</title>
<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>The September 2020 fire event and AQMv7 system setup</title>
      <p id="d2e1475">The wildfires of September 2020 ranked among the most intense in the US in recent years. These fires produced dense smoke that initially moved westward over the Willamette Valley in western Oregon and eventually blanketed the broader region. As a result, air quality across Oregon, Washington, and Idaho rapidly deteriorated to hazardous levels, marking one of the worst air quality periods in recent decades (Mass et al., 2022). Wildfire smoke originating from California, Oregon, and Washington was injected into the free troposphere and transported across the country by prevailing winds, leading to hazy conditions in several states. According to Li et al. (2021), from August to October 2020, wildfires in the western US contributed 23 % of surface <inline-formula><mml:math id="M84" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> across CONUS, with higher contributions observed along the Pacific Coast (43 %) and in the mountain region (42 %). This study focuses on the peak fire activity occurring between 1 and 21 September.</p>
      <p id="d2e1489">In this research, the model configuration is almost the same as the operational AQMv7 setup except for running over the CONUS domain with a 3-hourly cycling interval. The AQMv7 system is configured over the CONUS domain with a grid spacing of 13 <inline-formula><mml:math id="M85" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">km</mml:mi></mml:mrow></mml:math></inline-formula> and 65 vertical levels, extending up to 0.2 <inline-formula><mml:math id="M86" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">hPa</mml:mi></mml:mrow></mml:math></inline-formula>. The system uses the Global Forecast System version 16 (GFSv16) physics package within the Common Community Physics Package (CCPP) framework to generate the meteorological fields driving air quality predictions.  Meteorological initial conditions and lateral boundary conditions are generated using GFS forecast outputs with lead times up to 30 <inline-formula><mml:math id="M87" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> at 3 <inline-formula><mml:math id="M88" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> intervals from the previous GFS cycle. Fire-related emissions are represented using real-time Regional hourly Advanced Baseline Imager (ABI) and Visible Infrared Imaging Radiometer Suite (VIIRS) Emissions (RAVE) data at 0.03° spatial resolution. Anthropogenic emissions are based on the 2016 US EPA NEI Collaborative (NEIC2016v1) modeling platform.  Gas-phase chemistry is simulated using the Carbon Bond Mechanism version 6 (CB6r3) with updated isoprene chemistry and revised photolysis rates. More detailed information about the model configuration, including physics, chemistry options, anthropogenic emissions, and fire emissions, can be found in Huang et al. (2025).</p>
</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title><inline-formula><mml:math id="M89" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations</title>
      <p id="d2e1543">In this study, surface <inline-formula><mml:math id="M90" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations were obtained from two sources: AirNow and PurpleAir observing networks. These datasets differ in sensor type, spatial coverage, and quality control (QC) requirements. AirNow provides regulatory-grade measurements from federal, state, and local monitoring stations, while PurpleAir is a low-cost, community-based network of air quality sensors. PurpleAir sensors are widely deployed by individuals and communities, providing real-time data on <inline-formula><mml:math id="M91" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> concentrations as well as meteorological variables such as temperature, pressure, and relative humidity. Only the data reported from outdoor <inline-formula><mml:math id="M92" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> sensors are used in this study. The PurpleAir data were available for registered users through the PurpleAir API (<uri>https://community.purpleair.com/t/api-use-guidelines/1589</uri>, last access: 18 February 2026).</p>
<sec id="Ch1.S3.SS2.SSS1">
  <label>3.2.1</label><title>PurpleAir <inline-formula><mml:math id="M93" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> quality control</title>
      <p id="d2e1601">Quality control and correction of PurpleAir data followed the methodology described in Barkjohn et al. (2021). Readers are referred to that paper for further details. The following quality control (QC) filters were applied to the raw PurpleAir <inline-formula><mml:math id="M94" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> measurements: <list list-type="bullet"><list-item>
      <p id="d2e1617">Reported <inline-formula><mml:math id="M95" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values from two Plantower sensors within the PurpleAir sensor (channels A and B) must be nonnegative.</p></list-item><list-item>
      <p id="d2e1632">The PurpleAir sensor channel A and B consistency: <list list-type="custom"><list-item><label>–</label>
      <p id="d2e1637">Absolute difference <inline-formula><mml:math id="M96" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M97" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, <italic>or</italic></p></list-item><list-item><label>–</label>
      <p id="d2e1672">Relative difference within 61 %.</p></list-item></list></p></list-item><list-item>
      <p id="d2e1676"><inline-formula><mml:math id="M98" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values must not exceed <inline-formula><mml:math id="M99" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">10</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values.</p></list-item><list-item>
      <p id="d2e1701"><inline-formula><mml:math id="M100" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values must be less than 3000 <inline-formula><mml:math id="M101" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> (upper threshold).</p></list-item><list-item>
      <p id="d2e1734">Gross check of relative humidity with range 0 %–100 %.</p></list-item></list> Only PurpleAir <inline-formula><mml:math id="M102" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> measurements that passed all the above QC criteria were retained for subsequent correction.</p>
</sec>
<sec id="Ch1.S3.SS2.SSS2">
  <label>3.2.2</label><title>PurpleAir <inline-formula><mml:math id="M103" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> correction</title>
      <p id="d2e1769">A correction is required because the PurpleAir raw data usually overestimate <inline-formula><mml:math id="M104" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> concentrations under typical ambient and smoke-impacted conditions.  Correction of PurpleAir <inline-formula><mml:math id="M105" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> measurements was performed using a multiple linear regression model based on sensor-reported <inline-formula><mml:math id="M106" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (PA) and relative humidity (RH), following the correction formula proposed by Barkjohn et al. (2021):

              <disp-formula id="Ch1.E6" content-type="numbered"><label>6</label><mml:math id="M107" display="block"><mml:mrow><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.524</mml:mn><mml:mo>×</mml:mo><mml:mtext>PA</mml:mtext><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.0862</mml:mn><mml:mo>×</mml:mo><mml:mtext>RH</mml:mtext><mml:mo>+</mml:mo><mml:mn mathvariant="normal">5.75</mml:mn></mml:mrow></mml:math></disp-formula></p>
      <p id="d2e1836">We adopt the above equation because it is valid across the United States, having been derived by fitting data from September 2017 until January 2020. In addition, although the correction was originally derived for 24 <inline-formula><mml:math id="M108" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> averaged <inline-formula><mml:math id="M109" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, it is consistent with a regression equation obtained from the September 2020 dataset based on 1 <inline-formula><mml:math id="M110" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> averaged <inline-formula><mml:math id="M111" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>.</p>
</sec>
<sec id="Ch1.S3.SS2.SSS3">
  <label>3.2.3</label><title>Observation error assignment</title>
      <p id="d2e1886">Observation error standard deviations were assigned to each network. The AirNow <inline-formula><mml:math id="M112" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observation errors were set to 5 % of the observed values.  For PurpleAir <inline-formula><mml:math id="M113" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data, the observation errors were set to 10 % of the observed values to reflect the greater uncertainty typically associated with lower-cost sensors compared with regulatory AirNow monitors. The 10 % value is also consistent with the EPA definition of acceptable measurement uncertainty, which specifies a 10 % coefficient of variation for total precision (EPA, 2006).</p>
</sec>
<sec id="Ch1.S3.SS2.SSS4">
  <label>3.2.4</label><title>Observation spatial distribution</title>
      <p id="d2e1919">Figure 1a and b show the spatial distribution of AirNow and PurpleAir <inline-formula><mml:math id="M114" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> monitoring stations at 12:00 UTC on 16 September 2020. PurpleAir sensors are especially concentrated in densely populated areas, leading to notable spatial variability in observation coverage during the September 2020 wildfire events. Coverage is particularly dense in urban regions of the western United States (e.g. California, Oregon, Washington, Utah, Arizona and Colorado), while rural and remote areas have significantly fewer sensors, for example, Nevada and North Dakota. Figure 1c displays the time series of domain-averaged <inline-formula><mml:math id="M115" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values and station counts from the AirNow and PurpleAir networks. The number of AirNow stations ranges from approximately 800 to 900, while PurpleAir stations number between 1160 and 1300. Dropouts in the AirNow network lead to sudden decreases in station count and corresponding drops in the <inline-formula><mml:math id="M116" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> time series. In contrast, the PurpleAir network shows a general upward trend in station count, with no major data dropouts observed.</p>

      <fig id="F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e1957"><bold>(a, b)</bold> Spatial distribution of AirNow (AN) and PurpleAir (PA) <inline-formula><mml:math id="M117" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> monitoring stations at 12:00 UTC on 16 September 2020. For PurpleAir, only stations that passed the quality control are shown. The displayed values are the corrected concentrations calculated using Eq. (6). <bold>(c)</bold> Time series of domain-averaged <inline-formula><mml:math id="M118" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values and station counts from the AirNow and PurpleAir observing networks.</p></caption>
            <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f01.png"/>

          </fig>

</sec>
</sec>
<sec id="Ch1.S3.SS3">
  <label>3.3</label><title>Background error covariance</title>
      <p id="d2e2002">In this study, the background error standard deviation (<inline-formula><mml:math id="M119" display="inline"><mml:mi mathvariant="bold">Σ</mml:mi></mml:math></inline-formula>) for each control variable is constructed based on the background forecast; specifically, the error standard deviations of an aerosol variable are prescribed as proportional to its background values.</p>
      <p id="d2e2012">The proportional scaling factor <inline-formula><mml:math id="M120" display="inline"><mml:mi>s</mml:mi></mml:math></inline-formula> is approximately estimated by building a linear relationship between the <inline-formula><mml:math id="M121" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> standard error (<inline-formula><mml:math id="M122" display="inline"><mml:mi mathvariant="bold">Σ</mml:mi></mml:math></inline-formula>) and the background forecast <inline-formula><mml:math id="M123" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn><mml:mtext>bkg</mml:mtext></mml:msubsup></mml:mrow></mml:math></inline-formula> concentrations:

            <disp-formula id="Ch1.E7" content-type="numbered"><label>7</label><mml:math id="M124" display="block"><mml:mrow><mml:mi mathvariant="bold">Σ</mml:mi><mml:mo>=</mml:mo><mml:mi>s</mml:mi><mml:mo>⋅</mml:mo><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn><mml:mtext>bkg</mml:mtext></mml:msubsup></mml:mrow></mml:mrow></mml:math></disp-formula>

          The scaling factor <inline-formula><mml:math id="M125" display="inline"><mml:mi>s</mml:mi></mml:math></inline-formula> is subsequently applied to all <inline-formula><mml:math id="M126" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> components, i.e., the 70 prognostic aerosol variables, to construct their error standard deviations.</p>
      <p id="d2e2094">This proportionality-based approach has also been adopted in the MOCAGE operational system (Colette et al., 2024), where background error standard deviations are similarly prescribed relative to background concentrations as a first-order approximation.</p>
      <p id="d2e2097">Tang et al. (2023) tested a similar method, in which the background <inline-formula><mml:math id="M127" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> error variance is first estimated using the Hollingsworth–Lönnberg method (Hollingsworth and Lönnberg, 1986). A linear relationship is then established between the estimated <inline-formula><mml:math id="M128" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> standard error and the background forecast <inline-formula><mml:math id="M129" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn><mml:mtext>bkg</mml:mtext></mml:msubsup></mml:mrow></mml:math></inline-formula>.</p>
      <p id="d2e2136">Here we adopt the same idea but use an alternative approach to roughly estimate the background <inline-formula><mml:math id="M130" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast error variance. The background <inline-formula><mml:math id="M131" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> error variance (<inline-formula><mml:math id="M132" display="inline"><mml:mrow><mml:msup><mml:mi mathvariant="bold">Σ</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>) is estimated using <inline-formula><mml:math id="M133" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> innovation information <inline-formula><mml:math id="M134" display="inline"><mml:mi mathvariant="bold-italic">d</mml:mi></mml:math></inline-formula> defined in Sect. 2.2, and observation error information <inline-formula><mml:math id="M135" display="inline"><mml:mi mathvariant="bold">R</mml:mi></mml:math></inline-formula> specified in Sect. 3.2.3, specifically,

            <disp-formula id="Ch1.E8" content-type="numbered"><label>8</label><mml:math id="M136" display="block"><mml:mrow><mml:msup><mml:mi mathvariant="bold">Σ</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mi>E</mml:mi><mml:mo>(</mml:mo><mml:mi mathvariant="bold-italic">d</mml:mi><mml:msup><mml:mi mathvariant="bold-italic">d</mml:mi><mml:mi mathvariant="normal">T</mml:mi></mml:msup><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:mi mathvariant="bold">R</mml:mi></mml:mrow></mml:math></disp-formula>

          In Eq. (8), <inline-formula><mml:math id="M137" display="inline"><mml:mrow><mml:mi>E</mml:mi><mml:mo>(</mml:mo><mml:mo>⋅</mml:mo><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula> denotes the mathematical expectation operator. The superscript T denotes the transpose of a vector. Equation (8) is valid under the assumption that observation and background errors are uncorrelated. This assumption is reasonable when the innovation vector <inline-formula><mml:math id="M138" display="inline"><mml:mi mathvariant="bold-italic">d</mml:mi></mml:math></inline-formula> is calculated using forecasts from a free-running model without any aerosol data assimilation.</p>
      <p id="d2e2249">In this study, short-term (e.g., 3 <inline-formula><mml:math id="M139" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>) <inline-formula><mml:math id="M140" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts from a free run conducted during 1–21 September 2020 were used to compute the innovation vector <inline-formula><mml:math id="M141" display="inline"><mml:mi mathvariant="bold-italic">d</mml:mi></mml:math></inline-formula>. This free run, referred to as the <italic>control run</italic>, is described in detail in the following section. Using the innovations and observation errors from Sects. 2.2 and 3.2.3 as inputs to Eq. (8), the background error variance of <inline-formula><mml:math id="M142" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> was first estimated. This error, along with the background values, was then used in Eq. (7) to estimate the scaling factor, <inline-formula><mml:math id="M143" display="inline"><mml:mi>s</mml:mi></mml:math></inline-formula>. This scaling factor was subsequently applied in all assimilation experiments presented in this study.</p>
      <p id="d2e2300">This proportionality-based approach implicitly assumes that displacement errors and severe background underprediction errors do not dominate, thereby focusing the assimilation process on correcting amplitude. It offers several benefits: <list list-type="bullet"><list-item>
      <p id="d2e2305">It helps constrain analysis increments to physically meaningful regions. For example, it prevents the generation of sea salt aerosol increments over inland areas where no sea salt is present in the background. This is a problem that can occur when using GSI's height-dependent or latitude–height-dependent background error variance formulations, particularly when individual aerosol species are used as control variables.</p></list-item><list-item>
      <p id="d2e2309">It introduces location- and time-dependent background error variance information, improving the realism of background error specification.  Moreover, the aerosol variables that dominate background errors vary by location and assimilation cycle, rather than being consistently dominated by the same species when using constant static background error statistics. For example, organic and black carbon typically exhibit the largest errors in wildfire regions and downwind areas affected by smoke, whereas other regions may be dominated by non-organic aerosols.</p></list-item></list></p>
      <p id="d2e2312">An example of the domain-averaged background <inline-formula><mml:math id="M144" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> error standard deviation from a data assimilation run that assimilated both AirNow and PurpleAir <inline-formula><mml:math id="M145" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> is shown in Fig. 2. This figure is intended to illustrate the main difference from static, constant background errors, though the actual errors used in the data assimilation experiments are the errors of the individual aerosol control variables. This approach clearly produces error estimates that vary dynamically with location and time, with particularly large error variances during the peak fire events of 10–20 September 2020.</p>

      <fig id="F2"><label>Figure 2</label><caption><p id="d2e2339">Domain averaged <inline-formula><mml:math id="M146" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> error standard deviations for the data assimilation run that assimilated both AirNow and PurpleAir <inline-formula><mml:math id="M147" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f02.png"/>

        </fig>

      <p id="d2e2371">The background error correlation matrix <inline-formula><mml:math id="M148" display="inline"><mml:mi mathvariant="bold">C</mml:mi></mml:math></inline-formula> is modeled using a generic diffusion correlation operator designed for short length scales, as implemented in the System-Agnostic Background Error Representation (SABER) repository (Sluka, 2024). The primary input parameters are the horizontal and vertical cutoff length scales, defined as the distances beyond which correlations are zero. A horizontal cutoff scale of 100 <inline-formula><mml:math id="M149" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">km</mml:mi></mml:mrow></mml:math></inline-formula> is applied, consistent with estimates derived from NMC statistics in previous GSI applications (Wang et al., 2021). For vertical correlations, this study uses a cutoff length scale of 12 model levels, which helps confine the influence of surface <inline-formula><mml:math id="M150" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations within the average daytime planetary boundary layer (PBL) height (<inline-formula><mml:math id="M151" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">1450</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M152" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">m</mml:mi></mml:mrow></mml:math></inline-formula>) and has demonstrated improved surface <inline-formula><mml:math id="M153" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> prediction as will be discussed in Sect. 4.</p>
</sec>
<sec id="Ch1.S3.SS4">
  <label>3.4</label><title>Update of total particle number and surface area concentrations</title>
      <p id="d2e2438">After the aerosol mass concentration has been analyzed, total particle number concentration and total surface area concentration can be updated accordingly. For simplicity, it is assumed that the ratio of the particle number concentration to total particulate volume within each mode (I, J, K) remains the same as in the background. Total particulate volume is used instead of mass mixing ratio because it is proportional to the particle number concentration (see Eq. 3 in Binkowski and Roselle, 2003). A similar assumption was adopted by Li et al. (2013) to update number concentrations for the WRF-Chem model.</p>
      <p id="d2e2441">The number of particles is updated using the following relation:

            <disp-formula id="Ch1.E9" content-type="numbered"><label>9</label><mml:math id="M154" display="block"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>×</mml:mo><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub></mml:mrow></mml:math></disp-formula>

          Where: <list list-type="bullet"><list-item>
      <p id="d2e2480"><inline-formula><mml:math id="M155" display="inline"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M156" display="inline"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are the number of particles in the analysis and background, respectively, within each mode.</p></list-item><list-item>
      <p id="d2e2505"><inline-formula><mml:math id="M157" display="inline"><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M158" display="inline"><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are the total particulate volumes in the analysis and background, respectively, within the same mode.</p></list-item></list></p>
      <p id="d2e2529">The total particulate volume (<inline-formula><mml:math id="M159" display="inline"><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> or <inline-formula><mml:math id="M160" display="inline"><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) within each mode is calculated by dividing the mass concentration of each aerosol variable by its corresponding density in that mode, and then summing the results. This updating approach implicitly assumes that changes in volume across the three modes are driven solely by variations in particle number, rather than shifts in the aerosol size distribution. The total particulate surface area within each mode is then updated using the same volume ratio, i.e., <inline-formula><mml:math id="M161" display="inline"><mml:mstyle displaystyle="false"><mml:mfrac style="text"><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>V</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle></mml:math></inline-formula> multiplied by the background surface area.</p>
      <p id="d2e2573">In preparatory work for this study, six-hourly cycling experiments (Wang et al., 2025a) have shown that updating these variables is crucial for improving AQMv7 performance. In contrast, previous work using GSI with earlier developmental versions of AQM did not update these variables, primarily because those model versions were less advanced than the current operational AQMv7. As a result, there was still significant room for improving prediction skills.</p>
</sec>
<sec id="Ch1.S3.SS5">
  <label>3.5</label><title>Experiments</title>
      <p id="d2e2585">In the operational AQMv7 configuration, aerosol initial conditions (IC) are warm-started from a previous forecast cycle. In contrast, in cycling data assimilation and forecasting experiments, the data assimilation system provides aerosol initial conditions for the subsequent forecast, while the short-term (3 <inline-formula><mml:math id="M162" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>) forecast serves as the background for the next data assimilation cycle. A schematic of the data assimilation and forecasting cycles is shown in Fig. 3.</p>

      <fig id="F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e2598">A schematic of the data assimilation and forecasting cycles.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f03.png"/>

        </fig>

      <p id="d2e2607">In the assimilation cycle, JEDI updates the aerosol analysis by combining <inline-formula><mml:math id="M163" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations with the background information. The updated aerosol analysis, together with meteorological initial conditions, emissions, and other inputs, is then used to initialize the subsequent forecasts in the forecast cycle. Note that the meteorological initial conditions are not updated by JEDI but are generated from GFS forecast outputs of the previous GFS cycle.</p>
      <p id="d2e2622">Four experiments were conducted to evaluate the performance of JEDI/AQM <inline-formula><mml:math id="M164" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> DA. Table 1 provides a description of the experiments. The first experiment is a control run (CTR), in which meteorological initial and boundary conditions are updated every 3 <inline-formula><mml:math id="M165" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>, while chemical and aerosol fields are carried over from the 3 <inline-formula><mml:math id="M166" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast of the previous cycle. The other three experiments incorporate data assimilation: DA_AN, DA_PA, and DA_ANPA, which assimilate AirNow <inline-formula><mml:math id="M167" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> only, PurpleAir <inline-formula><mml:math id="M168" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> only, and both AirNow and PurpleAir <inline-formula><mml:math id="M169" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations, respectively.</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e2689">Descriptions of the experiments.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="4">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Experiment</oasis:entry>
         <oasis:entry colname="col2">Data</oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M170" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> Observations</oasis:entry>
         <oasis:entry colname="col4">Aerosol Fields</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Assimilation</oasis:entry>
         <oasis:entry colname="col3">Assimilated</oasis:entry>
         <oasis:entry colname="col4"/>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">CTR</oasis:entry>
         <oasis:entry colname="col2">No</oasis:entry>
         <oasis:entry colname="col3">None</oasis:entry>
         <oasis:entry colname="col4">Carried over from previous cycle's 3 <inline-formula><mml:math id="M171" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">DA_AN</oasis:entry>
         <oasis:entry colname="col2">Yes</oasis:entry>
         <oasis:entry colname="col3">AirNow <inline-formula><mml:math id="M172" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> only</oasis:entry>
         <oasis:entry colname="col4">Updated by Assimilation</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">DA_PA</oasis:entry>
         <oasis:entry colname="col2">Yes</oasis:entry>
         <oasis:entry colname="col3">PurpleAir <inline-formula><mml:math id="M173" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> only</oasis:entry>
         <oasis:entry colname="col4">Updated by Assimilation</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">DA_ANPA</oasis:entry>
         <oasis:entry colname="col2">Yes</oasis:entry>
         <oasis:entry colname="col3">AirNow + PurpleAir <inline-formula><mml:math id="M174" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4">Updated by Assimilation</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e2850">Like the CTR experiment, all DA experiments are conducted as 3-hourly cycling runs. Data assimilation is performed every 3 <inline-formula><mml:math id="M175" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>, and a 3 <inline-formula><mml:math id="M176" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast is launched at each cycle. This 3 <inline-formula><mml:math id="M177" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast serves as the background for the subsequent data assimilation and forecasting cycle. In addition, forecasts initialized at 00:00, 06:00, 12:00, and 18:00 UTC are extended to 24 <inline-formula><mml:math id="M178" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> for evaluation purposes. The experimental period spans from 12:00 UTC on 1 September to 18:00 UTC on 21 September 2020. 
It is noted that to reduce random sensor noise and improve comparability with the model resolution (<inline-formula><mml:math id="M179" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">13</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M180" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">km</mml:mi></mml:mrow></mml:math></inline-formula>), the PurpleAir <inline-formula><mml:math id="M181" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data were spatially averaged onto a <inline-formula><mml:math id="M182" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.1</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.1</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula> latitude–longitude grid before assimilation.</p>
</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Results</title>
      <p id="d2e2940">This section provides an overview of the impact of DA on <inline-formula><mml:math id="M183" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts. A total of 80 forecasts – initialized four times daily from 00:00 UTC on 2 September to 18:00 UTC on 21 September 2020 – are used to evaluate model performance. AirNow <inline-formula><mml:math id="M184" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations are used to verify the forecast. Forecast errors are assessed using bias, mean absolute error (MAE), and root mean square error (RMSE). Forecast performance is evaluated using box plots, which illustrate the distribution, spread, and central tendency of forecast errors. Time series of <inline-formula><mml:math id="M185" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> at various forecast hours are presented to examine the temporal evolution of forecast performance. Additionally, spatial distributions of <inline-formula><mml:math id="M186" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> including observations, forecasts, forecast errors, and forecast differences are analyzed to evaluate the spatial impact of data assimilation on <inline-formula><mml:math id="M187" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> predictions.</p>
      <p id="d2e2998">Figure 4 presents the bias, mean absolute error (MAE), and root mean square error (RMSE) for the 1–24 <inline-formula><mml:math id="M188" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast of domain-averaged <inline-formula><mml:math id="M189" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. Domain averages are computed over all states in the mainland United States. From the bias statistics (Fig. 4a), it is seen that the bias in the control run follows an upward trend initially, then reverses into a downward trend. The data assimilation runs show a similar trend, as data assimilation primarily corrects the model state and does not fully resolve inherent model bias. The control run underpredicted surface <inline-formula><mml:math id="M190" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> throughout the 24 <inline-formula><mml:math id="M191" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast period by about 1 <inline-formula><mml:math id="M192" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. This underprediction was improved in the data assimilation experiments. 
The two experiments that assimilate AirNow observations, DA_AN and DA_ANPA, reduced the 1–24 <inline-formula><mml:math id="M193" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> mean bias to <inline-formula><mml:math id="M194" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.2</mml:mn></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M195" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">0.3</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M196" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, respectively. The PurpleAir <inline-formula><mml:math id="M197" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation experiment (DA_PA) also slightly improved the 1–24 <inline-formula><mml:math id="M198" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> mean bias.</p>

      <fig id="F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e3127"><inline-formula><mml:math id="M199" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast errors for 1–24 <inline-formula><mml:math id="M200" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> lead times based on 80 forecasts initialized four times daily during 2–21 September 2020. Domain-averaged over CONUS. The <inline-formula><mml:math id="M201" display="inline"><mml:mi>x</mml:mi></mml:math></inline-formula> axis represents forecast lead times from 1 to 24 <inline-formula><mml:math id="M202" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>.  <bold>(a)</bold> Bias, <bold>(b)</bold> Mean Absolute Error (MAE), <bold>(c)</bold> Root Mean Square Error (RMSE).</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f04.png"/>

      </fig>

      <p id="d2e3180">DA_PA produces a near-zero bias at the 1 <inline-formula><mml:math id="M203" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast; however, this is due to large positive and negative biases canceling out. Therefore, the bias should be interpreted together with metrics such as the mean absolute error (MAE) and root mean square error (RMSE), which quantify the actual magnitude of forecast errors.</p>
      <p id="d2e3191">In terms of MAE and RMSE, all the three data assimilation experiments reduced the surface <inline-formula><mml:math id="M204" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast error throughout the 24 <inline-formula><mml:math id="M205" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast period. The added value of assimilating PurpleAir <inline-formula><mml:math id="M206" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data alongside AirNow observations is evident in the consistent MAE reduction (Fig. 4b).  Its impact on RMSE (Fig. 4c) is also positive, though relatively small.  Overall, all the data assimilation experiments show improved forecast skill compared to the control run.</p>
      <p id="d2e3224">Figure 5 shows box-and-whisker plots of <inline-formula><mml:math id="M207" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast bias. Across all forecast hours, the interquartile range (IQR) – represented by the height of the boxes – is consistently smaller for the DA experiments compared to the control run. This indicates reduced forecast error spread between the 25th and 75th percentiles and suggests more consistent forecasts in the DA experiments. Although the median forecast bias in the control run is sometimes closer to zero, the DA_ANPA experiment performs comparably in terms of central tendency while showing clear improvements in reducing the mean forecast bias, as also reflected in Fig. 4a. Among the DA experiments, DA_AN and DA_ANPA show the most consistent improvement at 24 <inline-formula><mml:math id="M208" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> lead times, with DA_ANPA slightly outperforming others during the early forecast hours (e.g., hour 1 to 12). This suggests that assimilating PurpleAir observations in addition to AirNow helps reduce bias and brings the forecasts closer to observed <inline-formula><mml:math id="M209" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> values in the short term.</p>

      <fig id="F5" specific-use="star"><label>Figure 5</label><caption><p id="d2e3259">Box-and-whisker plot of <inline-formula><mml:math id="M210" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast bias. Orange dot: domain averaged mean; Bottom edge  =  Q1 (25th percentile); Top edge  = Q3 (75th percentile); Height  =  Interquartile Range (IQR <inline-formula><mml:math id="M211" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> Q3 <inline-formula><mml:math id="M212" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula> Q1); Horizontal line inside box: The median (50th percentile); Whiskers: Extend to the min and max values within <inline-formula><mml:math id="M213" display="inline"><mml:mrow><mml:mn mathvariant="normal">1.5</mml:mn><mml:mo>×</mml:mo></mml:mrow></mml:math></inline-formula> IQR from Q1 and Q3.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f05.png"/>

      </fig>

      <p id="d2e3303">Figure 6 shows time series of <inline-formula><mml:math id="M214" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> averaged over CONUS at forecast hours 1, 12, and 24, respectively. Consistent with the evaluations in Figs. 4 and 5, all DA experiments generally improve <inline-formula><mml:math id="M215" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts. Notably, all DA experiments help correct underpredictions during 2–9 and 14–17 September.  In addition, the substantial overprediction during 9–13 September observed in the control run is partially mitigated by the DA experiments. Among the DA experiments, DA_AN and DA_ANPA show comparable performance and both outperform DA_PA.</p>

      <fig id="F6"><label>Figure 6</label><caption><p id="d2e3331">Time series of <inline-formula><mml:math id="M216" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> averaged over CONUS for <bold>(a)</bold> forecast hour 1, <bold>(b)</bold> forecast hour 12, and <bold>(c)</bold> forecast hour 24. The <inline-formula><mml:math id="M217" display="inline"><mml:mi>y</mml:mi></mml:math></inline-formula> axis is shown on a logarithmic scale.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f06.png"/>

      </fig>

      <p id="d2e3367">While we have investigated the impact of DA on <inline-formula><mml:math id="M218" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts in terms of temporal evolution, it is also important to examine the spatial distribution of forecast fields, associated errors, and the impact of <inline-formula><mml:math id="M219" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data assimilation.</p>
      <p id="d2e3392">Figure 7 presents the spatial distribution of temporally averaged <inline-formula><mml:math id="M220" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts at forecast hour 1, based on 80 forecasts initialized four times daily (00:00, 06:00, 12:00, and 18:00 UTC) from 2–21 September.  The effects of wildfire events are clearly seen in Fig. 7a, c and e across California, Oregon, and Washington – where the fires occurred – as well as in downstream regions such as Montana, Wyoming, Utah, and Colorado impacted by smoke advection and transport.</p>

      <fig id="F7" specific-use="star"><label>Figure 7</label><caption><p id="d2e3408">Spatial distribution of average <inline-formula><mml:math id="M221" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> at forecast hour 1, based on 80 forecasts initialized four times daily (00:00, 06:00, 12:00, and 18:00 UTC) during 2–21 September.  <bold>(a)</bold> <inline-formula><mml:math id="M222" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in experiment CTR (shaded) overlaid with AirNow <inline-formula><mml:math id="M223" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations (filled dots).   <bold>(b)</bold> <inline-formula><mml:math id="M224" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> bias in experiment CTR.   <bold>(c)</bold> <inline-formula><mml:math id="M225" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in experiment DA_AN (shaded) overlaid with AirNow <inline-formula><mml:math id="M226" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations.   
<bold>(d)</bold> <inline-formula><mml:math id="M227" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> difference between experiments DA_AN and CTR.  <bold>(e)</bold> <inline-formula><mml:math id="M228" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in experiment DA_PA (shaded) overlaid with AirNow <inline-formula><mml:math id="M229" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations.  <bold>(f)</bold> <inline-formula><mml:math id="M230" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> difference between experiments DA_PA and CTR.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f07.png"/>

      </fig>

      <p id="d2e3547">1 <inline-formula><mml:math id="M231" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M232" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast errors in the control run are evident in Fig. 6a but are more clearly highlighted in Fig. 7b, which shows the difference between the control run and AirNow observations. Significant overpredictions appear along the California coast, as well as in parts of the Midwest and Northeast US, including Tennessee, Kentucky, West Virginia, and Virginia.  Conversely, notable underpredictions are found over Colorado, New Mexico, much of Texas and Oklahoma, and several Gulf Coast states.</p>
      <p id="d2e3570">Both DA_AN (Fig. 7c and d) and DA_PA (Fig. 7e and f) show similar spatial correction patterns across California, Oregon, and Washington, particularly in reducing overpredictions along the California coast. They also produce comparable large-scale adjustments across the Northeast, Midwest, and Southern US, with their spatial patterns (Fig. 7d and f) largely opposite in sign to those in the CTR–AirNow difference (Fig. 7b). This indicates that both DA experiments effectively mitigate the control run's over- and underpredictions.</p>
      <p id="d2e3573">However, the magnitude of the corrections is generally smaller in DA_PA than in DA_AN. DA_PA shows its strongest impact over Nevada, northern Utah, Colorado, and southwestern New Mexico, where it helps alleviate regional underpredictions (Fig. 7e and f). These improvements are also observed in DA_ANPA, whose spatial pattern closely resembles DA_AN except over these few states (figures not shown).</p>
      <p id="d2e3576">The above analysis shows that data assimilation effectively corrects the 1 <inline-formula><mml:math id="M233" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast errors in the control run, particularly in the DA_AN and DA_ANPA experiments. It is therefore of interest to examine how data assimilation affects longer forecast lead times. Figure 8 presents the MAE from the CTR experiment and the percentage change in MAE (%) between the data assimilation (DA) experiments and the CTR experiment at the 24 <inline-formula><mml:math id="M234" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast lead time. Negative values in Fig. 8b–d indicate a reduction in MAE.</p>

      <fig id="F8" specific-use="star"><label>Figure 8</label><caption><p id="d2e3597"><bold>(a)</bold> MAE from the control (CTR) experiment.  Percentage change in MAE (%) relative to CTR for <bold>(b)</bold> DA_AN, <bold>(c)</bold> DA_PA, and <bold>(d)</bold> DA_ANPA. The percentage change is calculated as (MAE(DA) <inline-formula><mml:math id="M235" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula> MAE(CTR)) <inline-formula><mml:math id="M236" display="inline"><mml:mo>/</mml:mo></mml:math></inline-formula> MAE(CTR) <inline-formula><mml:math id="M237" display="inline"><mml:mrow><mml:mo>×</mml:mo><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula>.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f08.png"/>

      </fig>

      <p id="d2e3642">It is seen from Fig. 8a that the largest MAE values occur in California, Oregon, Washington, Idaho, Montana, Wyoming, Utah, Colorado, and Arizona.  The <inline-formula><mml:math id="M238" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> MAE in these states is generally greater than 10 <inline-formula><mml:math id="M239" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, with maximum values exceeding 150 <inline-formula><mml:math id="M240" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> at certain stations in California, Oregon, and Washington. In contrast, regions less affected by wildfire smoke exhibit MAE values below 10 <inline-formula><mml:math id="M241" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>.</p>
      <p id="d2e3714">All DA experiments (Fig. 8b–d) show overall reductions in MAE at most stations. MAE reduction varies by location, with substantial improvements observed in regions with large forecast errors, such as California, Oregon, Washington, and Idaho, where MAE is reduced by approximately 20 %. On average, assimilation of AirNow <inline-formula><mml:math id="M242" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations alone significantly improves the 24 <inline-formula><mml:math id="M243" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast skill, with MAE reductions of 6.6 % based on MAE percentage changes averaged over all stations. In contrast, assimilation of PurpleAir data alone reduces the MAE by only 1.7 %. Assimilating both AirNow and PurpleAir <inline-formula><mml:math id="M244" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations reduces the MAE by 7.6 %, indicating that PurpleAir data provides complementary value to AirNow in improving forecast skill.</p>
      <p id="d2e3747">In the DA_PA experiment, a few eastern coastal states from Georgia to Virginia exhibit large percentage increases in MAE. These increases are associated with relatively small absolute errors, as MAE values in the CTR experiment over these states are typically only 2–4 <inline-formula><mml:math id="M245" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">m</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> (Fig. 8a). Increased MAE is also present at several stations at the 1 <inline-formula><mml:math id="M246" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast lead time in the DA_PA experiment in these areas (figure not shown). In contrast, the MAE increase at the 24 <inline-formula><mml:math id="M247" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast lead time is much less pronounced in the experiment assimilating only AirNow <inline-formula><mml:math id="M248" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations. This behavior suggests potential quality issues in the assimilated PurpleAir data in those areas that require further investigation, although a contribution from model errors cannot be ruled out.</p>
      <p id="d2e3796">To further examine model performance across different regions, error statistics (bias, MAE, and RMSE) for the averaged 1–24 <inline-formula><mml:math id="M249" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula>
<inline-formula><mml:math id="M250" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecasts from the control and data assimilation experiments over the 10 EPA regions are analyzed. Figure 9 presents the EPA Regions 1–10 and the averaged 1–24 <inline-formula><mml:math id="M251" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M252" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast error statistics in each EPA region.</p>

      <fig id="F9" specific-use="star"><label>Figure 9</label><caption><p id="d2e3839"><bold>(a)</bold> EPA Regions 1–10. Averaged 1–24 <inline-formula><mml:math id="M253" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M254" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> forecast errors: <bold>(b)</bold> Bias, <bold>(c)</bold> MAE and <bold>(d)</bold> RMSE.</p></caption>
        <graphic xlink:href="https://gmd.copernicus.org/articles/19/2479/2026/gmd-19-2479-2026-f09.png"/>

      </fig>

      <p id="d2e3878">In terms of bias (Fig. 9b), the DA_AN and DA_ANPA forecasts show improved performance relative to the control run. The DA_PA experiment also improves bias over most EPA regions, except for increased overprediction in EPA regions 8 and 9. For MAE and RMSE, the DA_AN and DA_ANPA experiments generally show improved performance across all EPA regions. The DA_PA experiment also exhibits improved, or at least comparable, MAE relative to the control run. However, DA_PA shows slightly increased RMSE over EPA regions 1–4, while reduced RMSE is found over other EPA regions.</p>
      <p id="d2e3882">Substantial reductions in MAE and RMSE are observed over EPA regions 8–10, where fire events occurred and/or where regions were most influenced by transported smoke. This is consistent with the large 1 <inline-formula><mml:math id="M255" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> MAE reduction shown in Fig. 8. Notably, the DA_PA experiment, which assimilates PA observations alone, reduces both MAE and RMSE over EPA regions 8–10.  Assimilating PurpleAir data together with AirNow data results in slightly smaller MAE and RMSE over these regions, suggesting that PurpleAir observations nonetheless provide complementary information to AirNow in these regions.</p>
</sec>
<sec id="Ch1.S5" sec-type="conclusions">
  <label>5</label><title>Summary and discussion</title>
      <p id="d2e3902">The latest version of NOAA's regional AQM system became operational on 14 May 2024. This system is based on the online coupling of the FV3 atmospheric model with the CMAQ model within the UFS framework. To improve initial conditions for AQM and enhance predictions of wildfire impacts on air quality, the capability to assimilate <inline-formula><mml:math id="M256" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations into AQMv7 was developed within JEDI and evaluated using its 3D-Var assimilation component in this study. The developed assimilation scheme can also be used to generate analysis (reanalysis) datasets for other applications, for example, providing data for training artificial intelligence models used in air quality prediction.</p>
      <p id="d2e3916">Data assimilation experiments were conducted for the September 2020 Western US wildfire episode, using 3-hourly cycling with observations from the AirNow and PurpleAir networks. In the data assimilation experiments, the location- and time-dependent background error standard deviations of an aerosol variable are specified as proportional to its background values, using a diagnosed scaling factor. In addition to updating the analyzed aerosol variables in each mode, the particle number concentration and surface area of each mode are also updated. The results show that assimilating AirNow <inline-formula><mml:math id="M257" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> observations improves 1–24 <inline-formula><mml:math id="M258" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> forecast skill. Assimilating PurpleAir data alone yields modest improvements in MAE. Combining PurpleAir with AirNow observations provides additional benefit by slightly further reducing MAE relative to AirNow-only assimilation, indicating that PurpleAir observations nonetheless provide complementary information to AirNow. The AirNow data assimilation alone or with PurpleAir data generally shows reduced MAE and RMSE across all EPA regions, whereas the largest reductions in MAE and RMSE are observed over regions affected by fire events and/or strongly influenced by transported smoke. 
The positive impact of PurpleAir data assimilation on smoke prediction during the September 2020 wildfires has also been demonstrated in an experimental Rapid Refresh Forecast System coupled with the Smoke and Dust Model (Wang et al., 2023), where it significantly reduced the model's 24 <inline-formula><mml:math id="M259" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">h</mml:mi></mml:mrow></mml:math></inline-formula> underprediction of surface <inline-formula><mml:math id="M260" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. Given that PurpleAir data coverage has improved since September 2020, the results of this study further highlight its potential to complement AirNow observations by filling spatial gaps and improving <inline-formula><mml:math id="M261" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> analysis and forecast skill.</p>
      <p id="d2e3968">In this initial development and evaluation of aerosol data assimilation in JEDI for AQMv7, the control variables are defined as individual forecast aerosol variables. In previous work on aerosol data assimilation for an earlier version of AQM using the GSI system (Wang et al., 2021), one option for the control variables was to define them as the total aerosol mass in each of the three modes, resulting in just three control variables. A control variable transform was then applied to partition the analysis increments across these modes to individual aerosol species, based on the ratio of each species' mass to the total mass within the corresponding mode.  The use of total aerosol mass in the three modes as control variables – thereby reducing the number of control variables from 70 to 3 – is planned for a future phase of development. The use of total masses as control variables also reduces the cost of the background error statistics calculation and iterative minimization (Kumar et al., 2019).</p>
      <p id="d2e3971">This study focused on surface-level <inline-formula><mml:math id="M262" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and did not incorporate vertical profile constraints with satellite-based aerosol optical depth (AOD) retrievals, which could further enhance forecast skill. A key challenge is the need for a robust forward operator in the CRTM AOD module – specifically, the creation and validation of lookup tables (LUTs) for AOD calculations with AQM. As an intermediate solution, existing LUTs in CRTM, such as the GEOS-5 LUTs, have been tested by grouping and mapping AQM aerosol species to those used in GEOS-5 (Wang et al., 2025). AOD assimilation also depends on an accurate vertical distribution of aerosols in the background field so that the CRTM AOD operator can provide meaningful gradient information at the correct vertical levels to constrain the analysis update. However, AQM models have shown deficiencies for the September 2020 fire events in representing smoke concentrations at and above plume rise levels, largely due to how fire emissions are injected into the model. This will be improved in the next update of the operational AQM.</p>
</sec>

      
      </body>
    <back><notes notes-type="codedataavailability"><title>Code and data availability</title>

      <p id="d2e3989">The AQMv7 model, JEDI software and <inline-formula><mml:math id="M263" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and fire emission data we used in this research are publicly available on Zenodo (<ext-link xlink:href="https://doi.org/10.5281/zenodo.17049857" ext-link-type="DOI">10.5281/zenodo.17049857</ext-link>, Wang et al., 2025b). Users are referred to the guidance on compiling and running the model (<uri>https://ufs-srweather-app.readthedocs.io/en/develop/UsersGuide/index.html</uri>, last access: 26 August 2025).  Global Forecast System analysis data were downloaded from the NCAR Research Data Archive: <ext-link xlink:href="https://doi.org/10.5065/D65D8PWK" ext-link-type="DOI">10.5065/D65D8PWK</ext-link> (DOC/NOAA/NWS/NCEP, 2015).</p>
  </notes><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e4017">HW designed and developed the <inline-formula><mml:math id="M264" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> DA capability within JEDI for the AQM model, conducted experiments, and evaluated performance; CM and JB contributed to <inline-formula><mml:math id="M265" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> DA methodology, advised on code implementation, and assisted in performance analysis; SW contributed to <inline-formula><mml:math id="M266" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> DA methodology and experimental design; RL conducted control experiments and contributed to workflow development; JL and KW contributed to model configuration and control run setup; YT contributed to background error modeling and observational error specification; HC, AT and HL contributed to workflow development; JL performed quality control and correction of PurpleAir observations.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e4056">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e4062">The scientific results and conclusions, as well as any views or opinions expressed herein, are those of the authors and do not necessarily reflect those of NOAA or the Department of Commerce. Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. The authors bear the ultimate responsibility for providing appropriate place names. Views expressed in the text are those of the authors and do not necessarily reflect the views of the publisher.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e4071">The authors sincerely thank Dr. Ming Hu and the three anonymous reviewers for their constructive comments and insightful suggestions, which significantly improved the quality and clarity of this manuscript. The authors also thank   Mohmmed Farooqui at Texas A&amp;M University-Kingsville for assisting with Python scripts to download the PurpleAir observations.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e4076">This research was supported by  the Fire Weather and Precipitation Research and Development in Support of the Disaster Relief Supplemental Appropriations Act (DRSA) project (NA23OAR4050200D), and in part by a NOAA Cooperative Agreement NA22OAR4320151 with the University of Colorado.</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e4082">This paper was edited by Narendra Ojha and reviewed by three anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bib1"><label>1</label><mixed-citation>Barkjohn, K. K., Gantt, B., and Clements, A. L.: Development and application of a United States-wide correction for <inline-formula><mml:math id="M267" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> data collected with the PurpleAir sensor, Atmos. Meas. Tech., 14, 4617–4637, <ext-link xlink:href="https://doi.org/10.5194/amt-14-4617-2021" ext-link-type="DOI">10.5194/amt-14-4617-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib2"><label>2</label><mixed-citation>Binkowski, F. S. and Roselle, S. J.: Models-3 Community Multiscale Air Quality (CMAQ) model aerosol component, 1, Model description, J. Geophys. Res.-Atmos., 108, 4183,  <ext-link xlink:href="https://doi.org/10.1029/2001JD001409" ext-link-type="DOI">10.1029/2001JD001409</ext-link>, 2003.</mixed-citation></ref>
      <ref id="bib1.bib3"><label>3</label><mixed-citation>Black, T. L., Abeles, J. A., Blake, B. T., Jovic, D., Rogers, E., Zhang, X., Aligo, E. A., Dawson, L. C., Lin, Y., Strobach, E., Shafran, P. C., and Carley, J. R.: A limited area modeling capability for the finite-volume cubed-sphere (FV3) dynamical core and comparison with a global two-way nest, J. Adv. Model. Earth Sy., 13, e2021MS002483,  <ext-link xlink:href="https://doi.org/10.1029/2021MS002483" ext-link-type="DOI">10.1029/2021MS002483</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib4"><label>4</label><mixed-citation>Chen, L., Mao, F., Hong, J., Zang, L., Chen, J., Zhang, Y., Gan, Y., Gong, W., and Xu, H.: Improving <inline-formula><mml:math id="M268" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> predictions during COVID-19 lockdown by assimilating multi-source observations and adjusting emissions, Environ. Pollut., 297, 118783, <ext-link xlink:href="https://doi.org/10.1016/j.envpol.2021.118783" ext-link-type="DOI">10.1016/j.envpol.2021.118783</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib5"><label>5</label><mixed-citation>Chen, X., Zhang, Y., Wang, K., Tong, D., Lee, P., Tang, Y., Huang, J., Campbell, P. C., Mcqueen, J., Pye, H. O. T., Murphy, B. N., and Kang, D.: Evaluation of the offline-coupled GFSv15–FV3–CMAQv5.0.2 in support of the next-generation National Air Quality Forecast Capability over the contiguous United States, Geosci. Model Dev., 14, 3969–3993, <ext-link xlink:href="https://doi.org/10.5194/gmd-14-3969-2021" ext-link-type="DOI">10.5194/gmd-14-3969-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib6"><label>6</label><mixed-citation> Cohen, A. J., Brauer, M., Burnett, R., Anderson, H. R., Frostad, J., Estep, K., Balakrishnan, K., Brunekreef, B., Dandona, L., Dandona, R., Feigin, V., Freedman, G., Hubbell, B., Jobling, A., Kan, H., Knibbs, L., Liu, Y., Martin, R., Morawska, L., Pope, C. A., Shin, H., Straif, K., Shaddick, G., Thomas, M., van Dingenen, R., van Donkelaar, A., Vos, T., Murray, C. J. L., and Forouzanfar, M. H.: Estimates and 25 year trends of the global burden of disease attributable to ambient air pollution: an analysis of data from the Global Burden of Diseases Study 2015, Lancet, 389, 1907–1918, 2017.</mixed-citation></ref>
      <ref id="bib1.bib7"><label>7</label><mixed-citation>Colette, A., Collin, G., Besson, F., Blot, E., Guidard, V., Meleux, F., Royer, A., Petiot, V., Miller, C., Fermond, O., Jeant, A., Adani, M., Arteta, J., Benedictow, A., Bergström, R., Bowdalo, D., Brandt, J., Briganti, G., Carvalho, A. C., Christensen, J. H., Couvidat, F., D'Elia, I., D'Isidoro, M., Denier van der Gon, H., Descombes, G., Di Tomaso, E., Douros, J., Escribano, J., Eskes, H., Fagerli, H., Fatahi, Y., Flemming, J., Friese, E., Frohn, L., Gauss, M., Geels, C., Guarnieri, G., Guevara, M., Guion, A., Guth, J., Hänninen, R., Hansen, K., Im, U., Janssen, R., Jeoffrion, M., Joly, M., Jones, L., Jorba, O., Kadantsev, E., Kahnert, M., Kaminski, J. W., Kouznetsov, R., Kranenburg, R., Kuenen, J., Lange, A. C., Langner, J., Lannuque, V., Macchia, F., Manders, A., Mircea, M., Nyiri, A., Olid, M., Pérez García-Pando, C., Palamarchuk, Y., Piersanti, A., Raux, B., Razinger, M., Robertson, L., Segers, A., Schaap, M., Siljamo, P., Simpson, D., Sofiev, M., Stangel, A., Struzewska, J., Tena, C., Timmermans, R., Tsikerdekis, T., Tsyro, S., Tyuryakov, S., Ung, A., Uppstu, A., Valdebenito, A., van Velthoven, P., Vitali, L., Ye, Z., Peuch, V.-H., and Rouïl, L.: Copernicus Atmosphere Monitoring Service – Regional Air Quality Production System v1.0, Geosci. Model Dev., 18, 6835–6883, <ext-link xlink:href="https://doi.org/10.5194/gmd-18-6835-2025" ext-link-type="DOI">10.5194/gmd-18-6835-2025</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib8"><label>8</label><mixed-citation>Colmer, J., Hardman, I., Shimshack, J., and Voorheis, J.: Disparities in <inline-formula><mml:math id="M269" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> air pollution in the United States, Science, 369, 575–578, <ext-link xlink:href="https://doi.org/10.1126/science.aaz9353" ext-link-type="DOI">10.1126/science.aaz9353</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib9"><label>9</label><mixed-citation>Derber, J. C. and Rosati, A.: A global ocean data assimilation system, J. Phys. Oceanogr., 19, 1333–1347,   <uri>https://doi.org/10.1175/1520-0485(1989)019&lt;1333:AGODAS&gt;2.0.CO;2</uri>, 1989.</mixed-citation></ref>
      <ref id="bib1.bib10"><label>10</label><mixed-citation>DOC/NOAA/NWS/NCEP: National Centers for Environmental Prediction, National Weather Service, NOAA, U.S. Department of Commerce,   NCEP GFS 0.25 Degree Global Forecast Grids Historical Archive, NSF National Center for Atmospheric Research [data set], <ext-link xlink:href="https://doi.org/10.5065/D65D8PWK" ext-link-type="DOI">10.5065/D65D8PWK</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib11"><label>11</label><mixed-citation>Environmental Protection Agency: Technical Note on Reporting <inline-formula><mml:math id="M270" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> Continuous Monitoring and Speciation Data to the Air Quality System (AQS), <ext-link xlink:href="https://www.epa.gov/aqs/aqs-memos-technical-note-reporting-pm25-continuous-monitoring-and-speciation-data-air-quality">https://www.epa.gov/aqs/aqs-memos-technical-note-reporting-pm25-continuous-monitoring-and-speciation-data-air-quality</ext-link> (last access: 24 March 2026), 8 November 2006.</mixed-citation></ref>
      <ref id="bib1.bib12"><label>12</label><mixed-citation>EPA: Wildfire and Air Quality, US Environmental Protection Agency, <uri>https://www.epa.gov/sites/default/files/2018-08/documents/epa-2018-science_annualreport_508compressed.pdf</uri> (last access: 24 March 2026), 2017.</mixed-citation></ref>
      <ref id="bib1.bib13"><label>13</label><mixed-citation>Ha, S.: Implementation of aerosol data assimilation in WRFDA (v4.0.3) for WRF-Chem (v3.9.1) using the RACM/MADE-VBS scheme, Geosci. Model Dev., 15, 1769–1788, <ext-link xlink:href="https://doi.org/10.5194/gmd-15-1769-2022" ext-link-type="DOI">10.5194/gmd-15-1769-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib14"><label>14</label><mixed-citation>Hollingsworth, A. and Lönnberg, P.: The statistical structure of short-range forecast errors as determined from radiosonde data, Part I: The wind field, Tellus A, 38, 111–136, <ext-link xlink:href="https://doi.org/10.1111/j.1600-0870.1986.tb00460.x" ext-link-type="DOI">10.1111/j.1600-0870.1986.tb00460.x</ext-link>, 1986.</mixed-citation></ref>
      <ref id="bib1.bib15"><label>15</label><mixed-citation>Huang, B., Pagowski, M., Trahan, S., Martin, C. R., Tangborn, A., Kondragunta, S., and Kleist, D. T.: JEDI-based three-dimensional Ensemble-Variational Data Assimilation System for global aerosol forecasting at NCEP, J. Adv. Model. Earth Sy., 15, e2022MS003232,  <ext-link xlink:href="https://doi.org/10.1029/2022MS003232" ext-link-type="DOI">10.1029/2022MS003232</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib16"><label>16</label><mixed-citation>Huang, J., Stajner, I., Montuoro, R., Yang, F., Wang, K., Huang, H.-C., Jeon, C.-H., Curtis, B., McQueen, J., Liu, H., Baker, B., Tong, D., Tang, Y., Campbell, P., Grell, G., Frost, G., Schwantes, R., Wang, S., Kondragunta, S., Li, F., and Jung, Y.: Development of the next-generation air quality prediction system in the unified forecast system framework: enhancing predictability of wildfire air quality impacts, B. Am. Meteorol. Soc.,  <ext-link xlink:href="https://doi.org/10.1175/BAMS-D-23-0053.1" ext-link-type="DOI">10.1175/BAMS-D-23-0053.1</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib17"><label>17</label><mixed-citation>Lee, S., Song, C. H., Han, K. M., Henze, D. K., Lee, K., Yu, J., Woo, J.-H., Jung, J., Choi, Y., Saide, P. E., and Carmichael, G. R.: Impacts of uncertainties in emissions on aerosol data assimilation and short-term <inline-formula><mml:math id="M271" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> predictions over Northeast Asia, Atmos. Environ., 271, 118921, <ext-link xlink:href="https://doi.org/10.1016/j.atmosenv.2021.118921" ext-link-type="DOI">10.1016/j.atmosenv.2021.118921</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib18"><label>18</label><mixed-citation>Li, Y., Tong, D., Ma, S., Zhang, X., Kondragunta, S., Li, F., and Saylor, R.: Dominance of wildfires impact on air quality exceedances during the 2020 record-breaking wildfire season in the United States, Geophys. Res. Lett., 48, e2021GL094908,  <ext-link xlink:href="https://doi.org/10.1029/2021GL094908" ext-link-type="DOI">10.1029/2021GL094908</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib19"><label>19</label><mixed-citation>Li, Z., Zang, Z., Li, Q. B., Chao, Y., Chen, D., Ye, Z., Liu, Y., and Liou, K. N.: A three-dimensional variational data assimilation system for multiple aerosol species with WRF/Chem and an application to <inline-formula><mml:math id="M272" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> prediction, Atmos. Chem. Phys., 13, 4265–4278, <ext-link xlink:href="https://doi.org/10.5194/acp-13-4265-2013" ext-link-type="DOI">10.5194/acp-13-4265-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib20"><label>20</label><mixed-citation>Liu, Z., Snyder, C., Guerrette, J. J., Jung, B.-J., Ban, J., Vahl, S., Wu, Y., Trémolet, Y., Auligné, T., Ménétrier, B., Shlyaeva, A., Herbener, S., Liu, E., Holdaway, D., and Johnson, B. T.: Data assimilation for the Model for Prediction Across Scales – Atmosphere with the Joint Effort for Data assimilation Integration (JEDI-MPAS 1.0.0): EnVar implementation and evaluation, Geosci. Model Dev., 15, 7859–7878, <ext-link xlink:href="https://doi.org/10.5194/gmd-15-7859-2022" ext-link-type="DOI">10.5194/gmd-15-7859-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib21"><label>21</label><mixed-citation>Kumar, R., Monache, L. D., Bresch, J., Saide, P. E., Tang, Y., Liu, Z., Silva, A. M. da, Alessandrini, S., Pfister, G., Edwards, D., Lee, P., and Djalalova, I.: Toward improving short-term predictions of fine particulate matter over the United States via assimilation of satellite aerosol optical depth retrievals, J. Geophys. Res.-Atmos., 124, 2753–2773,  <ext-link xlink:href="https://doi.org/10.1029/2018JD029009" ext-link-type="DOI">10.1029/2018JD029009</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib22"><label>22</label><mixed-citation>Mass, C. F., Ovens, D., Conrick, R., and Saltenberger, J.: The September 2020 wildfires over the Pacific Northwest, Weather Forecast., 36, 1843–1865,  <ext-link xlink:href="https://doi.org/10.1175/WAF-D-21-0028.1" ext-link-type="DOI">10.1175/WAF-D-21-0028.1</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib23"><label>23</label><mixed-citation>O'Dell, K., Ford, B., Fischer, E. V., and Pierce, J. R.: Contribution of wildland-fire smoke to US <inline-formula><mml:math id="M273" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and its influence on recent trends, Environ. Sci. Technol., 53, 1797–1804, <ext-link xlink:href="https://doi.org/10.1021/acs.est.8b05430" ext-link-type="DOI">10.1021/acs.est.8b05430</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib24"><label>24</label><mixed-citation>Pagowski, M., Grell, G. A., McKeen, S. A., Peckham, S. E., and Devenyi, D.: Three-dimensional variational data assimilation of ozone and fine particulate matter observations: some results using the Weather Research and Forecasting–Chemistry model and grid-point statistical interpolation, Q. J. Roy. Meteor. Soc., 136, 2013–2024, <ext-link xlink:href="https://doi.org/10.1002/qj.700" ext-link-type="DOI">10.1002/qj.700</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib25"><label>25</label><mixed-citation>Pagowski, M., Liu, Z., Grell, G. A., Hu, M., Lin, H.-C., and Schwartz, C. S.: Implementation of aerosol assimilation in Gridpoint Statistical Interpolation (v. 3.2) and WRF-Chem (v. 3.4.1), Geosci. Model Dev., 7, 1621–1627, <ext-link xlink:href="https://doi.org/10.5194/gmd-7-1621-2014" ext-link-type="DOI">10.5194/gmd-7-1621-2014</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib26"><label>26</label><mixed-citation>Park, S.-Y., Dash, U. K., Yu, J., Yumimoto, K., Uno, I., and Song, C. H.: Implementation of an ensemble Kalman filter in the Community Multiscale Air Quality model (CMAQ model v5.1) for data assimilation of ground-level <inline-formula><mml:math id="M274" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, Geosci. Model Dev., 15, 2773–2790, <ext-link xlink:href="https://doi.org/10.5194/gmd-15-2773-2022" ext-link-type="DOI">10.5194/gmd-15-2773-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib27"><label>27</label><mixed-citation>Robichaud, A.: Surface data assimilation of chemical compounds over North America and its impact on air quality and Air Quality Health Index (AQHI) forecasts, Air Qual. Atmos. Hlth., 10, 955–970,  <ext-link xlink:href="https://doi.org/10.1007/s11869-017-0485-9" ext-link-type="DOI">10.1007/s11869-017-0485-9</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib28"><label>28</label><mixed-citation>Robichaud, A., Ménard, R., Zaïtseva, Y., and Anselmo, D.: Multipollutant surface objective analyses and mapping of air quality health index over North America, Air Qual. Atmos. Hlth., 9, 743–759, <ext-link xlink:href="https://doi.org/10.1007/s11869-015-0385-9" ext-link-type="DOI">10.1007/s11869-015-0385-9</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib29"><label>29</label><mixed-citation>Schwartz, C. S., Liu, Z., Lin, H.-C., and McKeen, S. A.: Simultaneous three-dimensional variational assimilation of surface fine particulate matter and MODIS aerosol optical depth, J. Geophys. Res.-Atmos., 117,  <ext-link xlink:href="https://doi.org/10.1029/2011JD017383" ext-link-type="DOI">10.1029/2011JD017383</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib30"><label>30</label><mixed-citation>Sluka, T.: Generic explicit diffusion operator added to JEDI, JCSDA Quarterly Newsletter, 74, <ext-link xlink:href="https://doi.org/10.25923/cfmw-2a05" ext-link-type="DOI">10.25923/cfmw-2a05</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib31"><label>31</label><mixed-citation>Sun, W., Liu, Z., Chen, D., Zhao, P., and Chen, M.: Development and application of the WRFDA-Chem three-dimensional variational (3DVAR) system: aiming to improve air quality forecasting and diagnose model deficiencies, Atmos. Chem. Phys., 20, 9311–9329, <ext-link xlink:href="https://doi.org/10.5194/acp-20-9311-2020" ext-link-type="DOI">10.5194/acp-20-9311-2020</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib32"><label>32</label><mixed-citation> Tang, Y., Martin, C. R., Huang, M., Chai, T., Pagowski, M., Wang, H., Kleist, D. T., Baker, B., Campbell, P. C., Huang, J., McQueen, J. T., Montuoro, R., Tong, D., Stajner, I., Jung, Y., Kumar, R., and Kondragunta, S.: Develop and evaluate JEDI-based regional aerosol data assimilation for NOAA UFS-AQM system, The 103rd AMS Annual Meeting, Denver, Colorado, 2023.</mixed-citation></ref>
      <ref id="bib1.bib33"><label>33</label><mixed-citation>Trémolet, Y. and Auligné, T.: The Joint Effort for Data Assimilation Integration (JEDI), JCSDA Quarterly Newsletter, 66, 1–5, <ext-link xlink:href="https://doi.org/10.25923/RB19-0Q26" ext-link-type="DOI">10.25923/RB19-0Q26</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib34"><label>34</label><mixed-citation>Vogel, A., Ménard, R., Abu, J., and Chen, J.: Towards a parametric Kalman filter for operational wildfire plume assimilation: Formulation of the forecast step, EGUsphere [preprint], <ext-link xlink:href="https://doi.org/10.5194/egusphere-2025-6386" ext-link-type="DOI">10.5194/egusphere-2025-6386</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib35"><label>35</label><mixed-citation>Wang, H., Weygandt, S., Pagowski, M., Li, R., Montuoro, R., Liu, Q., Dang, C., Ma, Y., Kumar, R., Kondragunta, S., Martin, C., Huang, J., McQueen, J., Stajner, I., and Hughes, B.: Assimilation of aerosol optical depth (AOD) retrievals and <inline-formula><mml:math id="M275" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> in NCEP's next-generation regional air quality forecasting system, WCRP-WWRP Symposium on Data Assimilation and Reanalysis, 2021.</mixed-citation></ref>
      <ref id="bib1.bib36"><label>36</label><mixed-citation>Wang, H., Weygandt, S., Ahmadov, R., Li, R., Romero-Alvarez, J., Li, H., Grell, G., Pagowski, M., Tang, Y., Martin, C., McQueen, J., and Farooqui, M.: Assimilation of surface particulate matter observations in the experimental Rapid Refresh Forecast System coupled with smoke and dust model, CU/CIRES Rendezvous 2023, Boulder, Colorado, <uri>https://insidecires.colorado.edu/rendezvous/uploads/Rendezvous_2023_7732_1683821981.pdf</uri> (last access: 13 March 2026), 2023.</mixed-citation></ref>
      <ref id="bib1.bib37"><label>37</label><mixed-citation> Wang, H., Martin, C. R., Barré, J. E., Li, R., Allen, B., Luo, H., Weygandt, S. S., Hu, M., Ahmadov, R., Huang, J., Tang, Y., Choi, H., Tangborn, A., Wang, K., Liu, H., Stajner, I., Dang, C., Kondragunta, S., and Kumar, R.: Aerosol data assimilation within JEDI for NOAA's regional air quality model (AQM), The 105th Annual Meeting of the American Meteorological Society, New Orleans, Louisiana, 2025a.</mixed-citation></ref>
      <ref id="bib1.bib38"><label>38</label><mixed-citation>Wang, H., Martin, C., Barré, J., Li, R., Weygandt, S., Huang, J., Tang, Y., Choi, H., Wang, K., Liu, H., and Lee, J.: <inline-formula><mml:math id="M276" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> assimilation within JEDI for NOAA's regional air quality model (AQMv7): application to the September 2020 western US wildfires, Zenodo [data set], <ext-link xlink:href="https://doi.org/10.5281/zenodo.17049857" ext-link-type="DOI">10.5281/zenodo.17049857</ext-link>, 2025b.</mixed-citation></ref>
      <ref id="bib1.bib39"><label>39</label><mixed-citation>Wei, Y., Zhao, X., Zhang, Z., Xu, J., Cheng, S., Liu, Z., Sun, W., Chen, X., Wang, Z., Hao, X., Li, J., and Chen, D.: Impact of model resolution and its representativeness consistency with observations on operational prediction of <inline-formula><mml:math id="M277" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> with 3D-VAR data assimilation, Atmos. Pollut. Res., 15, 102141, <ext-link xlink:href="https://doi.org/10.1016/j.apr.2024.102141" ext-link-type="DOI">10.1016/j.apr.2024.102141</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib40"><label>40</label><mixed-citation>Wen, J. and Burke, M.: Wildfire smoke plume segmentation using geostationary satellite imagery, arXiv, <ext-link xlink:href="https://doi.org/10.48550/arXiv.2109.01637" ext-link-type="DOI">10.48550/arXiv.2109.01637</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib41"><label>41</label><mixed-citation>Wu, J.-B., Xu, J., Pagowski, M., Geng, F., Gu, S., Zhou, G., Xie, Y., and Yu, Z.: Modeling study of a severe aerosol pollution event in December 2013 over Shanghai, China: An application of chemical data assimilation, Particuology, 20, 41–51, <ext-link xlink:href="https://doi.org/10.1016/j.partic.2014.10.008" ext-link-type="DOI">10.1016/j.partic.2014.10.008</ext-link>, 2015. </mixed-citation></ref>
      <ref id="bib1.bib42"><label>42</label><mixed-citation>White, S. R., Sugrue, R. A., Guillotte, L., James, E., Wang, H., Ahmadov, R., Thakur, N., and Chow, F. K.: Hourly <inline-formula><mml:math id="M278" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">PM</mml:mi><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> estimates across California from 2018 to 2023, ACS ES&amp;T Air, <ext-link xlink:href="https://doi.org/10.1021/acsestair.5c00372" ext-link-type="DOI">10.1021/acsestair.5c00372</ext-link>, 2026.</mixed-citation></ref>
      <ref id="bib1.bib43"><label>43</label><mixed-citation>Zhang, H., Yee, L. D., Lee, B. H., Curtis, M. P., Worton, D. R., Isaacman-VanWertz, G., Offenberg, J. H., Lewandowski, M., Kleindienst, T. E., Beaver, M. R., Holder, A. L., Lonneman, W. A., Docherty, K. S., Jaoui, M., Pye, H. O. T., Hu, W., Day, D. A., Campuzano-Jost, P., Jimenez, J. L., Guo, H., Weber, R. J., de Gouw, J., Koss, A. R., Edgerton, E. S., Brune, W., Mohr, C., Lopez-Hilfiker, F. D., Lutz, A., Kreisberg, N. M., Spielman, S. R., Hering, S. V., Wilson, K. R., Thornton, J. A., and Goldstein, A. H.: Monoterpenes are the largest source of summertime organic aerosol in the southeastern United States, P. Natl. Acad. Sci. USA, 115, 2038–2043,  <ext-link xlink:href="https://doi.org/10.1073/pnas.1717513115" ext-link-type="DOI">10.1073/pnas.1717513115</ext-link>, 2018.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>PM<sub>2.5</sub> assimilation within JEDI for NOAA's regional Air Quality Model (AQMv7): application to the September 2020 Western US wildfires</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>1</label><mixed-citation>
       Barkjohn, K. K., Gantt, B., and Clements, A. L.: Development and application of a United States-wide correction for PM<sub>2.5</sub> data collected with the PurpleAir sensor, Atmos. Meas. Tech., 14, 4617–4637, <a href="https://doi.org/10.5194/amt-14-4617-2021" target="_blank">https://doi.org/10.5194/amt-14-4617-2021</a>, 2021. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>2</label><mixed-citation>
       Binkowski, F. S. and Roselle, S. J.: Models-3 Community Multiscale Air Quality (CMAQ) model aerosol component, 1, Model description, J. Geophys. Res.-Atmos., 108, 4183,  <a href="https://doi.org/10.1029/2001JD001409" target="_blank">https://doi.org/10.1029/2001JD001409</a>, 2003.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>3</label><mixed-citation>
       Black, T. L., Abeles, J. A., Blake, B. T., Jovic, D., Rogers, E., Zhang, X., Aligo, E. A., Dawson, L. C., Lin, Y., Strobach, E., Shafran, P. C., and Carley, J. R.: A limited area modeling capability for the finite-volume cubed-sphere (FV3) dynamical core and comparison with a global two-way nest, J. Adv. Model. Earth Sy., 13, e2021MS002483,  <a href="https://doi.org/10.1029/2021MS002483" target="_blank">https://doi.org/10.1029/2021MS002483</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>4</label><mixed-citation>
       Chen, L., Mao, F., Hong, J., Zang, L., Chen, J., Zhang, Y., Gan, Y., Gong, W., and Xu, H.: Improving PM<sub>2.5</sub> predictions during COVID-19 lockdown by assimilating multi-source observations and adjusting emissions, Environ. Pollut., 297, 118783, <a href="https://doi.org/10.1016/j.envpol.2021.118783" target="_blank">https://doi.org/10.1016/j.envpol.2021.118783</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>5</label><mixed-citation>
       Chen, X., Zhang, Y., Wang, K., Tong, D., Lee, P., Tang, Y., Huang, J., Campbell, P. C., Mcqueen, J., Pye, H. O. T., Murphy, B. N., and Kang, D.: Evaluation of the offline-coupled GFSv15–FV3–CMAQv5.0.2 in support of the next-generation National Air Quality Forecast Capability over the contiguous United States, Geosci. Model Dev., 14, 3969–3993, <a href="https://doi.org/10.5194/gmd-14-3969-2021" target="_blank">https://doi.org/10.5194/gmd-14-3969-2021</a>, 2021. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>6</label><mixed-citation>
       Cohen, A. J., Brauer, M., Burnett, R., Anderson, H. R., Frostad, J., Estep, K., Balakrishnan, K., Brunekreef, B., Dandona, L., Dandona, R., Feigin, V., Freedman, G., Hubbell, B., Jobling, A., Kan, H., Knibbs, L., Liu, Y., Martin, R., Morawska, L., Pope, C. A., Shin, H., Straif, K., Shaddick, G., Thomas, M., van Dingenen, R., van Donkelaar, A., Vos, T., Murray, C. J. L., and Forouzanfar, M. H.: Estimates and 25-year trends of the global burden of disease attributable to ambient air pollution: an analysis of data from the Global Burden of Diseases Study 2015, Lancet, 389, 1907–1918, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>7</label><mixed-citation>
       Colette, A., Collin, G., Besson, F., Blot, E., Guidard, V., Meleux, F., Royer, A., Petiot, V., Miller, C., Fermond, O., Jeant, A., Adani, M., Arteta, J., Benedictow, A., Bergström, R., Bowdalo, D., Brandt, J., Briganti, G., Carvalho, A. C., Christensen, J. H., Couvidat, F., D'Elia, I., D'Isidoro, M., Denier van der Gon, H., Descombes, G., Di Tomaso, E., Douros, J., Escribano, J., Eskes, H., Fagerli, H., Fatahi, Y., Flemming, J., Friese, E., Frohn, L., Gauss, M., Geels, C., Guarnieri, G., Guevara, M., Guion, A., Guth, J., Hänninen, R., Hansen, K., Im, U., Janssen, R., Jeoffrion, M., Joly, M., Jones, L., Jorba, O., Kadantsev, E., Kahnert, M., Kaminski, J. W., Kouznetsov, R., Kranenburg, R., Kuenen, J., Lange, A. C., Langner, J., Lannuque, V., Macchia, F., Manders, A., Mircea, M., Nyiri, A., Olid, M., Pérez García-Pando, C., Palamarchuk, Y., Piersanti, A., Raux, B., Razinger, M., Robertson, L., Segers, A., Schaap, M., Siljamo, P., Simpson, D., Sofiev, M., Stangel, A., Struzewska, J., Tena, C., Timmermans, R., Tsikerdekis, T., Tsyro, S., Tyuryakov, S., Ung, A., Uppstu, A., Valdebenito, A., van Velthoven, P., Vitali, L., Ye, Z., Peuch, V.-H., and Rouïl, L.: Copernicus Atmosphere Monitoring Service – Regional Air Quality Production System v1.0, Geosci. Model Dev., 18, 6835–6883, <a href="https://doi.org/10.5194/gmd-18-6835-2025" target="_blank">https://doi.org/10.5194/gmd-18-6835-2025</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>8</label><mixed-citation>
       Colmer, J., Hardman, I., Shimshack, J., and Voorheis, J.: Disparities in PM<sub>2.5</sub> air pollution in the United States, Science, 369, 575–578, <a href="https://doi.org/10.1126/science.aaz9353" target="_blank">https://doi.org/10.1126/science.aaz9353</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>9</label><mixed-citation>
       Derber, J. C. and Rosati, A.: A global ocean data assimilation system, J. Phys. Oceanogr., 19, 1333–1347,   <a href="https://doi.org/10.1175/1520-0485(1989)019&lt;1333:AGODAS&gt;2.0.CO;2" target="_blank">https://doi.org/10.1175/1520-0485(1989)019&lt;1333:AGODAS&gt;2.0.CO;2</a>, 1989.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>10</label><mixed-citation>
      
DOC/NOAA/NWS/NCEP: National Centers for Environmental Prediction, National Weather Service, NOAA, U.S. Department of Commerce,   NCEP GFS 0.25 Degree Global Forecast Grids Historical Archive, NSF National Center for Atmospheric Research [data set], <a href="https://doi.org/10.5065/D65D8PWK" target="_blank">https://doi.org/10.5065/D65D8PWK</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>11</label><mixed-citation>
       Environmental Protection Agency: Technical Note on Reporting PM<sub>2.5</sub> Continuous Monitoring and Speciation Data to the Air Quality System (AQS), <a href="https://www.epa.gov/aqs/aqs-memos-technical-note-reporting-pm25-continuous-monitoring-and-speciation-data-air-quality" target="_blank">https://www.epa.gov/aqs/aqs-memos-technical-note-reporting-pm25-continuous-monitoring-and-speciation-data-air-quality</a> (last access: 24 March 2026), 8 November 2006.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>12</label><mixed-citation>
       EPA: Wildfire and Air Quality, US Environmental Protection Agency, <a href="https://www.epa.gov/sites/default/files/2018-08/documents/epa-2018-science_annualreport_508compressed.pdf" target="_blank">https://www.epa.gov/sites/default/files/2018-08/documents/epa-2018-science_annualreport_508compressed.pdf</a> (last access: 24 March 2026), 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>13</label><mixed-citation>
       Ha, S.: Implementation of aerosol data assimilation in WRFDA (v4.0.3) for WRF-Chem (v3.9.1) using the RACM/MADE-VBS scheme, Geosci. Model Dev., 15, 1769–1788, <a href="https://doi.org/10.5194/gmd-15-1769-2022" target="_blank">https://doi.org/10.5194/gmd-15-1769-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>14</label><mixed-citation>
       Hollingsworth, A. and Lönnberg, P.: The statistical structure of short-range forecast errors as determined from radiosonde data, Part I: The wind field, Tellus A, 38, 111–136, <a href="https://doi.org/10.1111/j.1600-0870.1986.tb00460.x" target="_blank">https://doi.org/10.1111/j.1600-0870.1986.tb00460.x</a>, 1986.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>15</label><mixed-citation>
       Huang, B., Pagowski, M., Trahan, S., Martin, C. R., Tangborn, A., Kondragunta, S., and Kleist, D. T.: JEDI-based three-dimensional Ensemble-Variational Data Assimilation System for global aerosol forecasting at NCEP, J. Adv. Model. Earth Sy., 15, e2022MS003232,  <a href="https://doi.org/10.1029/2022MS003232" target="_blank">https://doi.org/10.1029/2022MS003232</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>16</label><mixed-citation>
       Huang, J., Stajner, I., Montuoro, R., Yang, F., Wang, K., Huang, H.-C., Jeon, C.-H., Curtis, B., McQueen, J., Liu, H., Baker, B., Tong, D., Tang, Y., Campbell, P., Grell, G., Frost, G., Schwantes, R., Wang, S., Kondragunta, S., Li, F., and Jung, Y.: Development of the next-generation air quality prediction system in the unified forecast system framework: enhancing predictability of wildfire air quality impacts, B. Am. Meteorol. Soc.,  <a href="https://doi.org/10.1175/BAMS-D-23-0053.1" target="_blank">https://doi.org/10.1175/BAMS-D-23-0053.1</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>17</label><mixed-citation>
       Lee, S., Song, C. H., Han, K. M., Henze, D. K., Lee, K., Yu, J., Woo, J.-H., Jung, J., Choi, Y., Saide, P. E., and Carmichael, G. R.: Impacts of uncertainties in emissions on aerosol data assimilation and short-term PM<sub>2.5</sub> predictions over Northeast Asia, Atmos. Environ., 271, 118921, <a href="https://doi.org/10.1016/j.atmosenv.2021.118921" target="_blank">https://doi.org/10.1016/j.atmosenv.2021.118921</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>18</label><mixed-citation>
       Li, Y., Tong, D., Ma, S., Zhang, X., Kondragunta, S., Li, F., and Saylor, R.: Dominance of wildfires impact on air quality exceedances during the 2020 record-breaking wildfire season in the United States, Geophys. Res. Lett., 48, e2021GL094908,  <a href="https://doi.org/10.1029/2021GL094908" target="_blank">https://doi.org/10.1029/2021GL094908</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>19</label><mixed-citation>
       Li, Z., Zang, Z., Li, Q. B., Chao, Y., Chen, D., Ye, Z., Liu, Y., and Liou, K. N.: A three-dimensional variational data assimilation system for multiple aerosol species with WRF/Chem and an application to PM<sub>2.5</sub> prediction, Atmos. Chem. Phys., 13, 4265–4278, <a href="https://doi.org/10.5194/acp-13-4265-2013" target="_blank">https://doi.org/10.5194/acp-13-4265-2013</a>, 2013. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>20</label><mixed-citation>
       Liu, Z., Snyder, C., Guerrette, J. J., Jung, B.-J., Ban, J., Vahl, S., Wu, Y., Trémolet, Y., Auligné, T., Ménétrier, B., Shlyaeva, A., Herbener, S., Liu, E., Holdaway, D., and Johnson, B. T.: Data assimilation for the Model for Prediction Across Scales – Atmosphere with the Joint Effort for Data assimilation Integration (JEDI-MPAS 1.0.0): EnVar implementation and evaluation, Geosci. Model Dev., 15, 7859–7878, <a href="https://doi.org/10.5194/gmd-15-7859-2022" target="_blank">https://doi.org/10.5194/gmd-15-7859-2022</a>, 2022. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>21</label><mixed-citation>
       Kumar, R., Monache, L. D., Bresch, J., Saide, P. E., Tang, Y., Liu, Z., Silva, A. M. da, Alessandrini, S., Pfister, G., Edwards, D., Lee, P., and Djalalova, I.: Toward improving short-term predictions of fine particulate matter over the United States via assimilation of satellite aerosol optical depth retrievals, J. Geophys. Res.-Atmos., 124, 2753–2773,  <a href="https://doi.org/10.1029/2018JD029009" target="_blank">https://doi.org/10.1029/2018JD029009</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>22</label><mixed-citation>
       Mass, C. F., Ovens, D., Conrick, R., and Saltenberger, J.: The September 2020 wildfires over the Pacific Northwest, Weather Forecast., 36, 1843–1865,  <a href="https://doi.org/10.1175/WAF-D-21-0028.1" target="_blank">https://doi.org/10.1175/WAF-D-21-0028.1</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>23</label><mixed-citation>
       O'Dell, K., Ford, B., Fischer, E. V., and Pierce, J. R.: Contribution of wildland-fire smoke to US PM<sub>2.5</sub> and its influence on recent trends, Environ. Sci. Technol., 53, 1797–1804, <a href="https://doi.org/10.1021/acs.est.8b05430" target="_blank">https://doi.org/10.1021/acs.est.8b05430</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>24</label><mixed-citation>
       Pagowski, M., Grell, G. A., McKeen, S. A., Peckham, S. E., and Devenyi, D.: Three-dimensional variational data assimilation of ozone and fine particulate matter observations: some results using the Weather Research and Forecasting–Chemistry model and grid-point statistical interpolation, Q. J. Roy. Meteor. Soc., 136, 2013–2024, <a href="https://doi.org/10.1002/qj.700" target="_blank">https://doi.org/10.1002/qj.700</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>25</label><mixed-citation>
       Pagowski, M., Liu, Z., Grell, G. A., Hu, M., Lin, H.-C., and Schwartz, C. S.: Implementation of aerosol assimilation in Gridpoint Statistical Interpolation (v. 3.2) and WRF-Chem (v. 3.4.1), Geosci. Model Dev., 7, 1621–1627, <a href="https://doi.org/10.5194/gmd-7-1621-2014" target="_blank">https://doi.org/10.5194/gmd-7-1621-2014</a>, 2014. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>26</label><mixed-citation>
       Park, S.-Y., Dash, U. K., Yu, J., Yumimoto, K., Uno, I., and Song, C. H.: Implementation of an ensemble Kalman filter in the Community Multiscale Air Quality model (CMAQ model v5.1) for data assimilation of ground-level PM<sub>2.5</sub>, Geosci. Model Dev., 15, 2773–2790, <a href="https://doi.org/10.5194/gmd-15-2773-2022" target="_blank">https://doi.org/10.5194/gmd-15-2773-2022</a>, 2022. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>27</label><mixed-citation>
       Robichaud, A.: Surface data assimilation of chemical compounds over North America and its impact on air quality and Air Quality Health Index (AQHI) forecasts, Air Qual. Atmos. Hlth., 10, 955–970,  <a href="https://doi.org/10.1007/s11869-017-0485-9" target="_blank">https://doi.org/10.1007/s11869-017-0485-9</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>28</label><mixed-citation>
       Robichaud, A., Ménard, R., Zaïtseva, Y., and Anselmo, D.: Multipollutant surface objective analyses and mapping of air quality health index over North America, Air Qual. Atmos. Hlth., 9, 743–759, <a href="https://doi.org/10.1007/s11869-015-0385-9" target="_blank">https://doi.org/10.1007/s11869-015-0385-9</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>29</label><mixed-citation>
       Schwartz, C. S., Liu, Z., Lin, H.-C., and McKeen, S. A.: Simultaneous three-dimensional variational assimilation of surface fine particulate matter and MODIS aerosol optical depth, J. Geophys. Res.-Atmos., 117, D13202, <a href="https://doi.org/10.1029/2011JD017383" target="_blank">https://doi.org/10.1029/2011JD017383</a>, 2012.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>30</label><mixed-citation>
       Sluka, T.: Generic explicit diffusion operator added to JEDI, JCSDA Quarterly Newsletter, 74, <a href="https://doi.org/10.25923/cfmw-2a05" target="_blank">https://doi.org/10.25923/cfmw-2a05</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>31</label><mixed-citation>
       Sun, W., Liu, Z., Chen, D., Zhao, P., and Chen, M.: Development and application of the WRFDA-Chem three-dimensional variational (3DVAR) system: aiming to improve air quality forecasting and diagnose model deficiencies, Atmos. Chem. Phys., 20, 9311–9329, <a href="https://doi.org/10.5194/acp-20-9311-2020" target="_blank">https://doi.org/10.5194/acp-20-9311-2020</a>, 2020. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>32</label><mixed-citation>
       Tang, Y., Martin, C. R., Huang, M., Chai, T., Pagowski, M., Wang, H., Kleist, D. T., Baker, B., Campbell, P. C., Huang, J., McQueen, J. T., Montuoro, R., Tong, D., Stajner, I., Jung, Y., Kumar, R., and Kondragunta, S.: Develop and evaluate JEDI-based regional aerosol data assimilation for NOAA UFS-AQM system, The 103rd AMS Annual Meeting, Denver, Colorado, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>33</label><mixed-citation>
       Trémolet, Y. and Auligné, T.: The Joint Effort for Data Assimilation Integration (JEDI), JCSDA Quarterly Newsletter, 66, 1–5, <a href="https://doi.org/10.25923/RB19-0Q26" target="_blank">https://doi.org/10.25923/RB19-0Q26</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>34</label><mixed-citation>
       Vogel, A., Ménard, R., Abu, J., and Chen, J.: Towards a parametric Kalman filter for operational wildfire plume assimilation: Formulation of the forecast step, EGUsphere [preprint], <a href="https://doi.org/10.5194/egusphere-2025-6386" target="_blank">https://doi.org/10.5194/egusphere-2025-6386</a>, 2025. 
    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>35</label><mixed-citation>
       Wang, H., Weygandt, S., Pagowski, M., Li, R., Montuoro, R., Liu, Q., Dang, C., Ma, Y., Kumar, R., Kondragunta, S., Martin, C., Huang, J., McQueen, J., Stajner, I., and Hughes, B.: Assimilation of aerosol optical depth (AOD) retrievals and PM<sub>2.5</sub> in NCEP's next-generation regional air quality forecasting system, WCRP-WWRP Symposium on Data Assimilation and Reanalysis, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>36</label><mixed-citation>
       Wang, H., Weygandt, S., Ahmadov, R., Li, R., Romero-Alvarez, J., Li, H., Grell, G., Pagowski, M., Tang, Y., Martin, C., McQueen, J., and Farooqui, M.: Assimilation of surface particulate matter observations in the experimental Rapid Refresh Forecast System coupled with smoke and dust model, CU/CIRES Rendezvous 2023, Boulder, Colorado, <a href="https://insidecires.colorado.edu/rendezvous/uploads/Rendezvous_2023_7732_1683821981.pdf" target="_blank">https://insidecires.colorado.edu/rendezvous/uploads/Rendezvous_2023_7732_1683821981.pdf</a> (last access: 13 March 2026), 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>37</label><mixed-citation>
       Wang, H., Martin, C. R., Barré, J. E., Li, R., Allen, B., Luo, H., Weygandt, S. S., Hu, M., Ahmadov, R., Huang, J., Tang, Y., Choi, H., Tangborn, A., Wang, K., Liu, H., Stajner, I., Dang, C., Kondragunta, S., and Kumar, R.: Aerosol data assimilation within JEDI for NOAA's regional air quality model (AQM), The 105th Annual Meeting of the American Meteorological Society, New Orleans, Louisiana, 2025a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>38</label><mixed-citation>
       Wang, H., Martin, C., Barré, J., Li, R., Weygandt, S., Huang, J., Tang, Y., Choi, H., Wang, K., Liu, H., and Lee, J.: PM<sub>2.5</sub> assimilation within JEDI for NOAA's regional air quality model (AQMv7): application to the September 2020 western US wildfires, Zenodo [data set], <a href="https://doi.org/10.5281/zenodo.17049857" target="_blank">https://doi.org/10.5281/zenodo.17049857</a>, 2025b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>39</label><mixed-citation>
       Wei, Y., Zhao, X., Zhang, Z., Xu, J., Cheng, S., Liu, Z., Sun, W., Chen, X., Wang, Z., Hao, X., Li, J., and Chen, D.: Impact of model resolution and its representativeness consistency with observations on operational prediction of PM<sub>2.5</sub> with 3D-VAR data assimilation, Atmos. Pollut. Res., 15, 102141, <a href="https://doi.org/10.1016/j.apr.2024.102141" target="_blank">https://doi.org/10.1016/j.apr.2024.102141</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>40</label><mixed-citation>
       Wen, J. and Burke, M.: Wildfire smoke plume segmentation using geostationary satellite imagery, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.2109.01637" target="_blank">https://doi.org/10.48550/arXiv.2109.01637</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>41</label><mixed-citation>
      
Wu, J.-B., Xu, J., Pagowski, M., Geng, F., Gu, S., Zhou, G., Xie, Y., and Yu, Z.: Modeling study of a severe aerosol pollution event in December 2013 over Shanghai, China: An application of chemical data assimilation, Particuology, 20, 41–51, <a href="https://doi.org/10.1016/j.partic.2014.10.008" target="_blank">https://doi.org/10.1016/j.partic.2014.10.008</a>, 2015.


    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>42</label><mixed-citation>
       White, S. R., Sugrue, R. A., Guillotte, L., James, E., Wang, H., Ahmadov, R., Thakur, N., and Chow, F. K.: Hourly PM<sub>2.5</sub> estimates across California from 2018 to 2023, ACS ES&amp;T Air, <a href="https://doi.org/10.1021/acsestair.5c00372" target="_blank">https://doi.org/10.1021/acsestair.5c00372</a>, 2026.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>43</label><mixed-citation>
       Zhang, H., Yee, L. D., Lee, B. H., Curtis, M. P., Worton, D. R., Isaacman-VanWertz, G., Offenberg, J. H., Lewandowski, M., Kleindienst, T. E., Beaver, M. R., Holder, A. L., Lonneman, W. A., Docherty, K. S., Jaoui, M., Pye, H. O. T., Hu, W., Day, D. A., Campuzano-Jost, P., Jimenez, J. L., Guo, H., Weber, R. J., de Gouw, J., Koss, A. R., Edgerton, E. S., Brune, W., Mohr, C., Lopez-Hilfiker, F. D., Lutz, A., Kreisberg, N. M., Spielman, S. R., Hering, S. V., Wilson, K. R., Thornton, J. A., and Goldstein, A. H.: Monoterpenes are the largest source of summertime organic aerosol in the southeastern United States, P. Natl. Acad. Sci. USA, 115, 2038–2043,  <a href="https://doi.org/10.1073/pnas.1717513115" target="_blank">https://doi.org/10.1073/pnas.1717513115</a>, 2018.

    </mixed-citation></ref-html>--></article>
