<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="research-article">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">GMD</journal-id><journal-title-group>
    <journal-title>Geoscientific Model Development</journal-title>
    <abbrev-journal-title abbrev-type="publisher">GMD</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Geosci. Model Dev.</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1991-9603</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/gmd-19-2691-2026</article-id><title-group><article-title>Machine learning-driven characterization and prescription  of aerosol optical properties for atmospheric models</article-title><alt-title>Machine learning-driven characterization and prescription of aerosol optical properties</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes" rid="aff1">
          <name><surname>do Rosário</surname><given-names>Nilton Évora</given-names></name>
          <email>nrosario@unifesp.br</email>
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Longo</surname><given-names>Karla M.</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Toso</surname><given-names>Pedro H.</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Freitas</surname><given-names>Saulo R.</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-9879-646X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Yamasoe</surname><given-names>Marcia A.</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-3066-9146</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Rodrigues</surname><given-names>Luiz Flávio</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Medeiros</surname><given-names>Otavio</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Velho</surname><given-names>Haroldo Campos</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4">
          <name><surname>Menezes</surname><given-names>Isilda da Cunha</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-1111-5228</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4">
          <name><surname>Miranda</surname><given-names>Ana Isabel</given-names></name>
          
        </contrib>
        <aff id="aff1"><label>1</label><institution>Departamento de Ciências Ambientais, Universidade Federal de São Paulo, Diadema, SP, Brazil</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>Instituto Nacional de Pesquisas Espaciais (INPE), São José dos Campos, SP, Brazil</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>Departamento de Ciências Atmosféricas, Instituto de Astronomia, Geofísica e Ciências Atmosféricas,  Universidade de São Paulo, Cidade Universitária, São Paulo, SP, Brazil</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>Center for Environmental and Marine Studies (CESAM), Department of Environment and Planning,  University of Aveiro, Campus Universitário de Santiago, 3810-193 Aveiro, Portugal</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Nilton Évora do Rosário (nrosario@unifesp.br)</corresp></author-notes><pub-date><day>10</day><month>April</month><year>2026</year></pub-date>
      
      <volume>19</volume>
      <issue>7</issue>
      <fpage>2691</fpage><lpage>2716</lpage>
      <history>
        <date date-type="received"><day>30</day><month>January</month><year>2025</year></date>
           <date date-type="rev-request"><day>16</day><month>April</month><year>2025</year></date>
           <date date-type="rev-recd"><day>5</day><month>March</month><year>2026</year></date>
           <date date-type="accepted"><day>17</day><month>March</month><year>2026</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 Nilton Évora do Rosário et al.</copyright-statement>
        <copyright-year>2026</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026.html">This article is available from https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026.html</self-uri><self-uri xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026.pdf">The full text article is available as a PDF file from https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e190">Accurate modeling of aerosol optical properties is critical to simulate aerosol radiative effects. However, uncertainties regarding the simulation of aerosol-intensive optical properties are still significant. Therefore, the use of observations to constrain aerosol optical properties in models has been indicated as an option. Also, explicit computations of optical properties are still too costly for operational models, which makes observation-based prescriptions a convenient solution. We developed an observation-based prescription of aerosol optical properties driven by machine-learning techniques that can be applied in models. The Iberian Peninsula (IP) was taken as the reference domain, and the aerosol products from the AERONET sites across the IP were the main dataset. First, clustering was applied to define the typical aerosol optical regimes affecting the IP atmosphere. Five typical regimes were identified. Two of them were dominated by coarse mode, which was associated with Saharan dust. One was found to be close to pure dust, while the other indicated a mixed scenario of dust and pollution. Two of the non-dust regimes, strongly and moderately absorbing, were found to be associated with smoke. The remaining non-dust regime, with no clear association, occurs mostly in the eastern portion of the IP. Afterward, using aerosol-type columnar mass density from MERRA-2, a model was trained as a predictor of the optical regimes using the Random Forest method. The model was tested under distinct aerosol scenarios. Predictions' accuracy ranged from 60 % to 75 %, depending on the regime, while presenting an average accuracy of 70 %.</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>Fundação para a Ciência e a Tecnologia</funding-source>
<award-id>10.54499/PTDC/CTA-MET/3392/2020</award-id>
<award-id>10.54499/2023.17415.ICDT</award-id>
</award-group>
<award-group id="gs2">
<funding-source>Fundação para a Ciência e a Tecnologia</funding-source>
<award-id>10.54499/UID/50017/2025</award-id>
<award-id>10.54499/LA/P/0094/2020</award-id>
</award-group>
<award-group id="gs3">
<funding-source>Conselho Nacional de Desenvolvimento Científico e Tecnológico</funding-source>
<award-id>441851/2023-1</award-id>
<award-id>172486/2023-8</award-id>
<award-id>315349/2023-9</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e202">The importance of aerosols in the Earth's climate system is undisputed. Aerosol particles participate directly in the planetary energy budgets via the scattering and absorption of terrestrial and solar radiation (Kim and Ramanathan, 2008; IPCC, 2021; Li et al., 2022). However, this participation is permeated by high complexity due to the variety of aerosol particles sizes and composition, which cause significant uncertainty (Spencer et al., 2019; IPCC, 2021; Li et al., 2022). The uncertainties and challenges in accurately representing aerosol particles' processes in climate, weather, and environmental models arise from various limitations. For instance, when it comes to aerosol direct interaction with radiation, the current global aerosol monitoring system does not provide a comprehensive spatial-temporal characterization of spectral complex refractive index and size distribution of the aerosol particles, critical information to characterize the particle absorption and scattering (Samset et al., 2018; Li et al., 2022). This lack of observational data contributes significantly to uncertainty in aerosol modeling and, therefore, to the uncertainty of the aerosol radiative forcing.</p>
      <p id="d2e205">The difficulty of traditional libraries of aerosol optical and microphysical properties (Shettle and Fenn, 1979; Koepke et al., 1997; Hess et al., 1998) to describe geographical variation aerosol properties, for instance, soil dust mineralogy (Adebiyi et al., 2023), has been central in the aerosol optical properties uncertainty debate. Another critical aspect is the characterization of the state of the mixture of the aerosol particles in the model's aerosol modules (Samset et al., 2018; Sand et al., 2021). Given the complex dynamic of aerosol particle emission, transport, and removal in the atmosphere, numerical modelling of the state of the mixture and the resultant complex refractive index and size distribution is widely recognized as one of the most important sources of uncertainty in addressing aerosol particles' radiative forcing (Sand et al., 2021). According to Sand et al. (2021), aerosol absorption is poorly constrained, and the current climate models present a large range in the quantification of the main absorbing aerosol species – black carbon (BC), organic aerosols (OA), and mineral dust. Brown et al. (2021) findings indicate that biomass-burning aerosols in most climate models are too absorbing, mainly due to treatments of aerosol mixing state. They found the internal mixing assumptions used in climate models to overestimate Black Carbon (BC) absorption when compared to the observations. Saharan dust, a critical component of the global aerosol system, has been found to absorb less solar radiation than models estimate (Adebiyi et al., 2023), and the primary cause pointed out is the models' overestimation of the dust imaginary refractive index. Absorption is not the only issue facing aerosol particle representation in climate models; the relative contribution of fine and coarse mode particles is also a challenge. For instance, Adebiyi et al. (2023) also found models underestimating large dust particles when representing North African dust plumes.</p>
      <p id="d2e209">Observation-constrained models have been recommended to mitigate models' current difficulty in fully simulating aerosol properties and processes accurately (Samset et al., 2018; Proske et al., 2024). In addition to the uncertainty aspects, explicit simulation of aerosol composition and microphysical properties, followed by explicit computation of intensive optical properties, is still too expensive computationally for operational models, which also makes observational-based prescriptions a convenient solution. Zhong et al. (2022) used relationships from an ensemble of aerosol models and satellite observations to identify the primary source of uncertainty in aerosol modelling results in biomass burning regions. Their study pointed out the incorrect simulations of lifetimes and the underestimation of mass extinction coefficients as the main reasons for their difficulty in matching observed aerosol optical depth (AOD). As the largest, time and device-consistent observational network, capable of constraining multiple aerosol intensive microphysical and optical properties, the AErosol RObotic NETwork (AERONET) has been used worldwide to constrain models and satellite algorithms (Omar et al., 2005; Li et al., 2010; Levy et al., 2010; Rosário et al., 2013; Russell et al., 2014; Chen et al., 2023). Chen et al. (2023) developed an aerosol optical module with observation-constrained Black Carbon properties to improve aerosol absorption simulation. Their sensitivity simulations show a reduction of 18 %–69 % in the biases of aerosol single-scattering co-albedo when compared with global observations from AERONET. Li et al. (2010) used AERONET retrievals to evaluate and improve the performance of a GCM aerosol optical module. They found their GCM to simulate flatter Aerosol Optical Depth (AOD) spectral dependence, indicating an Angstrom Exponent (AE) biased to low values, which suggests that the aerosol sizes simulated were too large. After adjusting the aerosol's size based on AERONET retrievals, the agreement between simulated and observed AOD improved for all aerosol regimes, but especially for smoke and dust scenarios. Rosário et al. (2013) used a set of spectral optical models developed from AERONET sky retrievals over distinct biomes combined with the concept of anisotropic areas of influence of the AERONET sites (Hoelzemann et al., 2009) to constrain smoke aerosol radiative effect modelling during South American biomass burning. By doing so, they were able to capture the effect of the regional variability of smoke optical properties (absorption and size-related) on the surface solar irradiance related to the biomes' distinct nature of smoke.</p>
      <p id="d2e212">Global and regional cluster analysis of AERONET long-term retrievals of aerosol properties has proved valuable to classify observations in terms of aerosol optical regimes, providing means to qualitative constraints on aerosol properties (Omar et al., 2005; Levy et al., 2007; Russell et al., 2014; Li et al., 2019; Fan et al., 2021; Zhou et al., 2023). In these studies, the number of identified typical aerosol optical regimes varied from 4 to 10, numbers that were expected to likely represent either global or regional major aerosol scenarios, according to each study's focus. In their study, Zhou et al. (2023) found that regional aerosol regime classifications performed better than global classifications when applied to simulate AOD during pollution episodes and in different seasons in Beijing, China. They found larger differences between the strong and moderately absorbing aerosol regimes, namely dust and smoke regimes, when comparing global and regional clustering results. This is a consequence of the differences between China's regional dust and smoke aerosol particles' physical and chemical characteristics and those of global dust and smoke mean features. Another aspect highlighted by Zhou et al. (2023) is that smoke and dust-dominated optical regimes are more frequent globally than in China. Their result suggests that regional classification better captures typical aerosol optical regimes influencing a specific domain and, therefore, with the potential to improve observation-constrained simulations of aerosol radiative forcing.</p>
      <p id="d2e216">Focusing on the Iberian Peninsula (IP), this study sought to characterize the typical aerosol optical regimes driving the variability of aerosol-intensive properties over the peninsula, aiming to constrain aerosol optical properties prescription in atmospheric models using a novel machine-learning approach. IP is a region affected by a highly dynamic and complex set of aerosols mixing, including natural and anthropogenic particles (Cachorro et al., 2016; Gómez-Amo et al., 2017). Natural sources include marine aerosols from the Atlantic Ocean and Mediterranean Sea, mineral dust from North Africa, and, eventually, wildfire emissions. Major anthropogenic sources are urban-industrial, particularly in more densely populated regions, and biomass burning driven by human activities, especially in the north and central Portugal and eastern and northern Spain. Regional column-integrated optical properties are highly sensitive to the mixing of this diversity of aerosol types, in particular to dust and smoke mixing (Gómez-Amo et al., 2017).</p>
      <p id="d2e219">The manuscript is organized as follows: Sect. 2 includes a brief overview of the Iberian Peninsula, focusing on the main atmospheric circulation features and major aerosol particle sources affecting the region, followed by the description of the dataset and methods adopted to identify, characterize, and prescribe the identified aerosol typical regimes. Results and discussions are presented in Sect. 3. First, the identified aerosol optical regimes and their major features are described and contextualized. Subsequently, the results of the novel machine-learning approach to prescribing the optical regimes are discussed and evaluated. Finally, the main findings of our study are highlighted in the conclusion section.</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Study region, data and methods</title>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Study region</title>
      <p id="d2e237">The Iberian Peninsula (Fig. 1), comprising Spain and Portugal, exhibits diverse climate conditions due to its complex topography and proximity to the Atlantic Ocean, the Mediterranean Sea, and North Africa. The wind circulation over the peninsula is shaped by its location between the Atlantic Ocean and the Mediterranean Sea, diverse topography, and interactions between regional and global atmospheric patterns, leading to complex wind circulations that significantly influence the region's climate. This results in distinct climate zones, from arid deserts to lush green forests. The Mediterranean climate spans most of Spain, including the eastern and southern coastal regions and central Portugal, featuring hot and dry summers, especially inland. Winters are mild, rarely dropping below 10 °C in coastal areas. Most precipitation, often rain, occurs in autumn and winter, leading to dry summers that increase wildfire risks. Wildfires regularly occur in the IP region, fueled by extreme weather conditions, abnormal high temperature records combined with strong, dry winds (Asfaw et al., 2022; Ermitão et al., 2023). Under these scenarios, the entire region can be affected by smoke plumes that often shape the entire region's optical properties (Elias et al., 2004; Gómez-Amo et al., 2017). But wildfires are more frequent in the north and central region of Portugal and the north and eastern portion of Spain (Ermitão et al., 2023; Alvarez et al., 2024). Oceanic climate is typical in northern coastal regions of Spain, such as Galicia, Asturias, and the Basque Country, and parts of northern Portugal. The Atlantic Ocean influences mild temperatures year-round, with minimal seasonal variation and abundant, evenly distributed rainfall. Annual precipitation can exceed 1000 mm, with frequent cloud cover and high humidity, especially in winter. The Continental climate of the central plateau (Meseta Central) and the Ebro Valley feature extreme temperature variations, with hot summers, highs often above 35 °C, and winters below freezing. The central regions have less precipitation than the coastal areas, with a semi-arid climate in some parts. Most rainfall occurs in spring and autumn. Arid and Semi-Arid Climates are found in Southeastern Spain, especially in Murcia and Almería, and parts of the Ebro Valley. These areas receive very low rainfall, often less than 300 mm annually, leading to desert-like conditions like those in the Tabernas Desert. Summers are extremely hot, while winters are mild. Southern Spain, especially the Andalusian region, can be affected by hot and dry winds from the Sahara, causing heat waves and dust storms.</p>

      <fig id="F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e242">AERONET sites locations displayed on top of the Iberian Peninsula topography.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f01.png"/>

        </fig>

      <p id="d2e251">The occurrence of Saharan dust events on the Iberian Peninsula usually peaks in March and June, with a marked minimum in April and lowest occurrence in winter according to Cachorro et al. (2016). Depending on the synoptic conditions and circulation patterns, dust transport can affect the entire peninsula (Toledano et al., 2007). The prevailing westerlies, blowing from west to east, are the dominant wind pattern over the Iberian Peninsula. These winds are most prominent in the mid-latitudes, including the Iberian Peninsula. More pronounced in the northern region during autumn and winter, these winds bring moist air from the Atlantic, increasing precipitation in Galicia, the Basque Country, and northern Portugal. While they also affect central and southern areas, their impact is moderated by the peninsula's topography and other wind systems. The northeast trade winds affect the southern and western coasts of Portugal and southwestern Spain, creating a mild and dry climate, especially in summer. In contrast, Mediterranean winds affect the eastern and southeastern coasts. Additionally, the Iberian Thermal Low, resulting from intense heating of the Iberian interior, creates a low-pressure area that draws air from the Atlantic and Mediterranean shores, leading to converging wind patterns. This circulation pattern enhances sea breeze penetration and moderates coastal temperatures. Southern Spain is influenced by the Sahara winds, as said, these dry winds often carry dust, increasing the temperature and reducing air quality. Calima is a type of wind that occurs when Saharan dust reaches the peninsula, especially in summer, causing hazy skies, a reddish tint, and low visibility. These winds are linked to high-pressure systems over North Africa and low-pressure systems over the western Mediterranean.</p>
      <p id="d2e255">The wind circulation over the Iberian Peninsula is a dynamic and complex system shaped by global atmospheric patterns, regional geography, and local topography. The interaction of prevailing westerlies, trade winds, Mediterranean breezes, and local wind systems creates a diverse wind regime that affects the peninsula's climate. Understanding these patterns is essential for weather prediction, agriculture management, and tackling environmental challenges. According to Cachorro et al. (2016), these complex and contrasting influences of air masses from the Atlantic Ocean, Mediterranean Sea, European continent, and North Africa lead to a large spatio-temporal variability in aerosol properties, types, and mixing processes over the Iberian Peninsula. This makes the peninsula a challenging region for online modeling of aerosol microphysical properties and mixing state, therefore an interesting region to evaluate observation-based approaches, such as those based on climatological aerosol intensive optical properties from AERONET (Li et al., 2019; Fan et al., 2021; Zhou et al., 2023). The computation of optical properties for radiative transfer computations is usually based on a mass-weighted average of individual species at each grid point. This assumption of external mixing may not always be accurate, leading to significant uncertainties, such as excessive absorption by smoke aerosols and inaccuracies in dust size fractions. Observation-based approaches, such as those provided by AERONET retrieval climatology, attribute intensive optical properties to an effective aerosol based on actual observations. This method aims to reduce the uncertainties arising from the explicit simulation of these properties in climate models. The Iberian Peninsula, influenced by a variety of aerosol types, including dust, smoke, urban-industrial emissions, and marine aerosols, presents an interesting region to test this hypothesis.</p>
</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>AERONET aerosol inversion product</title>
      <p id="d2e266">AERONET is a global ground-based network of sun photometers mainly aimed at characterizing columnar aerosol particle properties (Holben et al., 1998). From the direct Sun attenuation measurements, AERONET algorithms derive spectral Aerosol Optical Depth (AOD<sub><italic>λ</italic></sub>) at the wavelengths 0.34, 0.38, 0.44, 0.50, 0.67, 0.87, 0.94, and 1.02 <inline-formula><mml:math id="M2" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>m. The interval between direct sun measurements is typically 15 minutes, but only cloud-free conditions are considered for aerosol retrievals. From the spectral dependency of AOD at these wavelengths, AERONET provides Angstrom Exponent (AE), a parameter sensitive to the aerosol particle size distribution (Eck et al., 1999). AERONET also provides several other intensive properties that depend not on the amount but on the nature of the aerosol, related to particle size, shape, and composition, from sky radiance measurements up to nine times a day at the wavelengths 0.44, 0.67, 0.87, and 1.02 <inline-formula><mml:math id="M3" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>m (Sinyuk et al., 2020). These intensive properties include microphysical parameters, such as refractive indices (<inline-formula><mml:math id="M4" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:math></inline-formula>) and volume size distribution, and also optical parameters like Single Scattering Albedo (SSA), asymmetry parameter (ASY), Lidar Ratio (LR), Linear Depolarization Ratio (LDR), Angstrom Exponent, among others (Holben et al., 1998; Dubovik et al., 2002). This set of aerosol intensive properties is expected to capture most of the important aspects that differentiate the distinct aerosols' optical regimes that affect the study region. For instance, the imaginary part of the complex refractive index (<inline-formula><mml:math id="M5" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>) and single scattering albedo (SSA) are properties that separate highly absorbing aerosol regimes from moderate and low absorbing regimes. Angstrom Exponent (AE) and Asymmetry Parameter (ASY) are properties that help separate aerosol regimes characterized by distinct size distributions. LR is highly sensitive to size and composition-related information, for instance, the real part of the complex refractive index. Meanwhile, LDR has high sensitivity to particle morphology, and it is widely used to separate dust particles from other aerosol types. Given the dependency of these intensive properties on the aerosol type (size and composition) and mixed state, it is possible to characterize the aerosol scenarios over a specific AERONET site in terms of their nature and sources (Eck et al., 1999; Dubovik et al., 2002). For instance, the LR is the ratio of the extinction coefficient to the backscatter coefficient and is crucial for identifying different aerosol types. It reflects how light scattering varies with particle size relative to the light wavelength. Small particles, like smoke, have a high LR, while large particles, like sea salt, have a low LR. Therefore, with a well-distributed regional network of AERONET's sun photometers, as that covering the Iberian Peninsula, one can characterize the spatial dynamics of aerosol types and mixture state influencing the regional aerosol regimes. Regarding the time period for the current study, it extends from 2003 to 2023. However, due to calibration and other operational aspects, some AERONET sites present different time ranges within this period.</p>
      <p id="d2e315">Three key aspects of aerosol nature have been widely used to link aerosol regimes with particle emission sources. These aspects are absorption efficiency, size distribution, and shape (Dubovik et al., 2002). For instance, combustion-based sources, including biomass and fossil fuel burning, produce aerosol dominated by fine mode particles, and absorption ranges from moderate to strong, depending on the nature of biomass burning, fossil fuel, and ageing processes. In contrast, natural sources, such as deserts and marine environments, produce aerosols dominated by coarse-mode particles. Marine aerosol particles are characterized by very low absorption, while dust aerosol can exhibit high absorption, mainly in the UV and VIS bands (Smirnov et al., 2002; Dubovik et al., 2002). Furthermore, the irregular shape of dust particles is a key factor that differentiates them from other aerosol types. This distinctive feature is captured by AERONET retrievals of the LDR (Shin et al., 2018). Source attribution provides valuable insights into the typical intensive optical properties affecting the atmospheric column of a site resulting from complex aerosol state mixtures. This understanding is crucial as it addresses a major challenge that current aerosol modules in CMIP6 climate models face (Zhao et al., 2022). Reproducing climatological aerosol-intensive properties scenarios over specific regions has been a major goal of atmospheric models. In addition to evaluating aerosol modules in atmospheric models, AERONET's optical properties in typical regimes, which can be expressed as spectral aerosol optical models (Omar et al., 2005; Levy et al., 2007; Rosário et al., 2013; Zhou et al., 2023), are valuable for simulating aerosol direct radiative effects in environmental models (Rosário et al., 2013; Li et al., 2019). This approach is especially beneficial when high computational capacity is unavailable and explicit aerosol modules are not feasible.</p>
      <p id="d2e318">With more than 25 years of operating a vast network of Cimel Electronique Sun–sky radiometers across the world, AERONET has provided highly accurate, ground-truth measurements of aerosol optical depth and other properties (Giles et al., 2019). It has been widely used as the main reference to evaluate and validate satellites (Gupta et al., 2018) and model products (Gliß et al., 2021). The two most critical intensive optical properties to estimating aerosol radiative forcing retrieved by AERONET, single scattering albedo (SSA) and asymmetry parameter (ASY), are related, respectively, to absorption and size of the aerosol. Their accuracies are aerosol loading dependent (Dubovik et al., 2002). For AOD <inline-formula><mml:math id="M6" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> 0.4 at 440 nm (or <inline-formula><mml:math id="M7" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0.2</mml:mn></mml:mrow></mml:math></inline-formula> at longer <inline-formula><mml:math id="M8" display="inline"><mml:mi mathvariant="italic">λ</mml:mi></mml:math></inline-formula>), SSA uncertainty <inline-formula><mml:math id="M9" display="inline"><mml:mo>≈</mml:mo></mml:math></inline-formula> <inline-formula><mml:math id="M10" display="inline"><mml:mrow><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.03</mml:mn></mml:mrow></mml:math></inline-formula>, for lower AOD, uncertainty can be <inline-formula><mml:math id="M11" display="inline"><mml:mrow><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.05</mml:mn></mml:mrow></mml:math></inline-formula>–0.07 or larger. Regarding ASY, uncertainty is about <inline-formula><mml:math id="M12" display="inline"><mml:mrow><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.02</mml:mn></mml:mrow></mml:math></inline-formula>–0.05 when AOD is high (<inline-formula><mml:math id="M13" display="inline"><mml:mrow><mml:mo>≥</mml:mo><mml:mn mathvariant="normal">0.4</mml:mn></mml:mrow></mml:math></inline-formula> at 440 nm, <inline-formula><mml:math id="M14" display="inline"><mml:mrow><mml:mo>≥</mml:mo><mml:mn mathvariant="normal">0.2</mml:mn></mml:mrow></mml:math></inline-formula> at longer wavelengths) but can be significantly larger at low AOD.</p>
      <p id="d2e403">Aiming to identify a representative set of typical aerosol regimes that affect the Iberian Peninsula, we applied cluster analysis methods (described in Sect. 2.4) to the AERONET sky radiance retrievals dataset from 2003 to 2023, taking advantage of the extensive coverage of AERONET sites across the region. Within that period, a total of 4395 retrievals from AERONET Level 2.0 retrievals products were obtained and applied in the clustering process. Table 1 presents a set of intensive properties provided by AERONET that was used to identify typical aerosol scenarios in the Iberian Peninsula atmospheric column. The variables displayed cover all three previously mentioned aspects, absorption efficiency, size distribution, and shape, which are expected to characterize the distinct nature of aerosol types and mixture anticipated in the study region.</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e410">List of AERONET inversions products (variables) used in clustering process followed by their abbreviation as defined by AERONET.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="2">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Variables</oasis:entry>
         <oasis:entry colname="col2">Abbreviation</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Refractive index – real part</oasis:entry>
         <oasis:entry colname="col2">RI<sub>Real</sub>(440), RI<sub>Real</sub>(670), RI<sub>Real</sub>(870), RI<sub>Real</sub>(1020)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Refractive index – imaginary part</oasis:entry>
         <oasis:entry colname="col2">RI<sub>Imag</sub>(440), RI<sub>Imag</sub>(670), RI<sub>Imag</sub>(870), RI<sub>Imag</sub>(1020)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Single scattering albedo</oasis:entry>
         <oasis:entry colname="col2">SSA(440), SSA(670), SSA(870), SSA(1020)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Asymmetry parameter</oasis:entry>
         <oasis:entry colname="col2">ASY(440), ASY(670), ASY(870), ASY(1020)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Linear depolarization ratio</oasis:entry>
         <oasis:entry colname="col2">LDR(440), LDR(670), LDR(870), LDR(1020)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Lidar ratio</oasis:entry>
         <oasis:entry colname="col2">LR(440), LR(670), LR(870), LR(1020)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Fine and coarse modes volume median radius</oasis:entry>
         <oasis:entry colname="col2">VMR-F,VMR-C</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Standard deviation from volume median radius, for fine and coarse modes</oasis:entry>
         <oasis:entry colname="col2">STD-F, STD-C</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Fine and coarse modes effective radius</oasis:entry>
         <oasis:entry colname="col2">Reff-F, Reff-C</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e591">We selected only AERONET sites that operated for at least two years and that have sky radiance inversion available with the highest quality level 2.0. Some selected sites are still operational, while others have been discontinued. Figure 1 illustrates the geographical distribution of the chosen sites. Our selection encompasses various landscapes of the Iberian Peninsula, from coastal plains regions (Coruña, Sagres, Burjassot) to highland plateaus in the interior (Madrid, Valladolid, Aras-de-los-Olmos) and lowland valleys (Zaragoza, Murcia). Regarding external air mass influence, sites in the southern border of IP are typically the first to experience the transport of dusty air masses from North Africa, with locations such as El-Arenosillo, Huelva, Malaga, and Sagres affected. The eastern sites (Barcelona, Burjassot, and Murcia) are expected to be strongly influenced by the Mediterranean air masses. Western and northern sites (Cabo da Roca, Coruna, Sagres) are directly under the influence of air mass from the Atlantic Ocean. Additionally, the Portuguese countryside (Evora) and eastern Spanish sites (Badajoz, Caceres) are located in regions that very often experience biomass burning during the dry season (Ermitão et al., 2023; Silva et al., 2023; Hammed et al., 2024; Alvarez et al., 2024).</p>
</sec>
<sec id="Ch1.S2.SS3">
  <label>2.3</label><title>Merra-2 aerosol diagnostic product</title>
      <p id="d2e602">The MERRA-2 (Modern-Era Retrospective Analysis for Research and Applications, Version 2) Aerosol Diagnostic Product (ADP) is a comprehensive dataset provided by NASA that offers global information about atmospheric aerosols (Gelaro et al., 2017; Buchard et al., 2017). MERRA-2 combines observational data with numerical models (reanalysis project) to create a detailed long-term record of atmospheric dynamics and composition from 1980 to the present. Among other variables, the MERRA-2 ADP product offers a long-term view of aerosol mass distribution by types and the related optical properties (Buchard et al., 2017). Its extended temporal coverage allows analysis of aerosol trends, such as those related to changes in atmospheric composition due to human activity and the impact on climate. Key features of the MERRA-2 ADP include aerosol microphysical and optical properties such as optical depth, mass concentration, and size distribution. These properties are crucial for understanding aerosol loading and composition in the atmosphere and their role in the Earth's radiation budget and climate system. A key aspect of MERRA-2 APD for this study is that it provides aerosol-type column mass density, our target variable as a predictor of aerosol optical model regime. The MERRA-2 APD includes diagnostics for the aerosol types considered in most chemistry transport models: Dust (DT), Black-Carbon (BC), Organic Carbon (OC), Sea-Salt (SS), and Sulfate (SF). The aerosol-type diagnostics variables cover mass concentration at specific levels and are integrated into the entire atmospheric column, which are applied to estimate columnar optical properties, such as extinction, scattering, and absorption optical depths, at multiple wavelengths. For this study, the 550 nm wavelength was used as a reference. Optical properties are a function of aerosol species, particle size, and relative humidity. To convert from the simulated aerosol masses to optical quantities such as aerosol optical depth, MERRA-2 uses Optics look-up tables (LUTs) derived from Mie calculations using parameters from the Optical Properties of Aerosols and Clouds (OPAC; Hess et al., 1998), as described in Chin et al. (2002) and Colarco et al. (2010), except for dust-type aerosol, which is based on Colarco et al. (2014). Therefore, these optical properties are by-products of running the MERRA-2 reanalysis system and made available to the community via MERRA-2 ADP. Further details on this can be found in Buchard et al. (2017). From these extensive aerosol-driven optical properties, it is possible to derive several MERRA-2 ADP intensive optical properties, such as Single Scattering Albedo (SSA).</p>
      <p id="d2e605">Given that the aerosol optical properties retrieved from each AERONET site are influenced by mixtures of different aerosol types, it is reasonable to assume that the impact of each aerosol type on the column's intensive optical properties is primarily determined by its concentration. Based on this premise, we propose a machine-learning approach that utilizes the aerosol-type column mass density predicted by chemistry transport models to prescribe the most accurate possible spatial distribution of the aerosol spectral optical model developed through cluster analysis of AERONET data. A description of the method presented in this study, exploring MERRA-2 products, can be found in Sect. 2.5.</p>
</sec>
<sec id="Ch1.S2.SS4">
  <label>2.4</label><title>Optical models development: cluster analysis</title>
      <p id="d2e616">Cluster analysis has been extensively used to develop aerosol optical models based on AERONET sky inversion products (Omar et al., 2005; Levy et al., 2007; Russell et al., 2014). The underlying principle is that AERONET instantaneous retrievals can be grouped into a certain number of clusters, each representing different categories of aerosol regimes. These studies have explored mainly the <inline-formula><mml:math id="M23" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-means clustering method, one of the most popular unsupervised machine learning algorithms for partitioning a dataset into a pre-defined number of clusters. However, specifying the number of clusters in advance poses a significant challenge for the <inline-formula><mml:math id="M24" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-means method. Fortunately, there are techniques available that reduce the subjectivity involved in this pre-definition. In our study, we adopted the Elbow method (Shi et al., 2021), a widely used method for determining the optimal number of clusters (<inline-formula><mml:math id="M25" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>) in a <inline-formula><mml:math id="M26" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-Means clustering algorithm. It examines the relationship between a range of number of clusters and the Within-Cluster Sum of Squares (WCSS), which measures the variance within each cluster (Eq. 1)

            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M27" display="block"><mml:mrow><mml:mi mathvariant="normal">WCSS</mml:mi><mml:mo>=</mml:mo><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>k</mml:mi></mml:munderover><mml:munder><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>x</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>C</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:munder><mml:mi mathvariant="normal">|</mml:mi><mml:mfenced open="|" close="|"><mml:mrow><mml:mi>x</mml:mi><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:msup><mml:mi mathvariant="normal">|</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></disp-formula>

          where <inline-formula><mml:math id="M28" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula> is the number of cluster <inline-formula><mml:math id="M29" display="inline"><mml:mrow><mml:msub><mml:mi>C</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the set of point in a cluster <inline-formula><mml:math id="M30" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the centroid of cluster <inline-formula><mml:math id="M31" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>, and <inline-formula><mml:math id="M32" display="inline"><mml:mrow><mml:msup><mml:mfenced open="|" close="|"><mml:mrow><mml:mi>x</mml:mi><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> is the squared Euclidean distance. The WCSS measures the compactness of the clustering, and one wants it to be as small as possible. If clusters are tight and well-separated, WCSS will be small, because points are close to their centroids. If clusters are loose or overlapping, WCSS will be large. The Elbow method is based on a plot of WCSS (<inline-formula><mml:math id="M33" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>) against the number of clusters (<inline-formula><mml:math id="M34" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>). As <inline-formula><mml:math id="M35" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula> increases, WCSS always decreases; more clusters mean tighter groups. The goal of the method is to identify the point (<inline-formula><mml:math id="M36" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>) where the rate of decrease in WCSS sharply slows down, indicating that adding more clusters yields diminishing returns. We ran our clustering algorithm with <inline-formula><mml:math id="M37" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula> varying from 2 to 10 clusters. For each <inline-formula><mml:math id="M38" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>, we calculated the total WCSS. The <inline-formula><mml:math id="M39" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula> results against WCSS were displayed in a plot, and the optimal number of clusters was defined based on the location (<inline-formula><mml:math id="M40" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>) of the bend (elbow) in the plot from which the change in WCSS slows down. This bend in the curve indicates the point where adding more clusters no longer gives meaningful improvement.</p>
      <p id="d2e815">The Elbow method has been widely used because of its straightforward approach to estimating the most appropriate number of clusters. However, we recognize that it still carries a certain degree of subjectivity, as it relies on visual interpretation. To reduce this subjectivity, we combined the Elbow and Stability methods to evaluate the optimal number of clusters that best represent the major aerosol regimes affecting the study region. Although more rigorous methods are available in the literature, defining the number of clusters remains a challenge, and different approaches often lead to distinct solutions (Krishnaveni et al., 2023). Nevertheless, despite the limitations of the Elbow method, the number of clusters identified in our study seems to provide a coherent characterization of optical regimes affecting the Iberian Peninsula.</p>
      <p id="d2e818">The <inline-formula><mml:math id="M41" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-means clustering analysis was performed using Scikit-learn, a Python open source machine learning library that supports supervised and unsupervised learning (Abraham et al., 2014). All our analyses were performed using the Scientific PYthon Development EnviRonment (Spyder), an open-source IDE for the Python language. As part of the preprocessing step, the values of the features listed in Table 1 were normalized using the <italic>StandardScaler</italic>( ) utility from <italic>sklearn.preprocessing</italic> package, which computes the mean and standard deviation. Then the scaled dataset was obtained subsequently by subtracting all values of the features from their respective mean and normalized by the corresponding standard deviation. With this scaling process we expected to avoid the dominance of features with large numeric ranges.</p>
      <p id="d2e835">To evaluate the robustness of the clustering results, a set of sensitivity analysis using the Scikit-learn library was performed. These tests were meant to test numerical stability, sampling robustness, clusters reproducibility, separation quality and presence of transitional regimes. A summary with all the results of these performed tests can be seen in the Supplement. First, a jitter robustness test was conducted by adding Gaussian noises taking different uncertainty estimates (5 %, 10 %, 20 %) to the standardized feature matrix and re-running the clustering algorithm multiple times (200 runs). The resulting partitions were compared with the original clustering using the Adjusted Rand Index (ARI), which assesses the sensitivity of the clustering structure to perturbations in feature space (mimicking features uncertainties). Second, a bootstrap robustness analysis was implemented by repeatedly resampling the dataset with replacement and recomputing the clustering solution for each resampled dataset. The ARI between the original and bootstrap-derived clusterings was calculated to evaluate the dependence of the clustering structure on specific samples and to test its reproducibility under data variability. In general, the mean ARI results for both jitter and bootstrap robustness analysis (Table S3) presented values above 0.80, which indicate high similarity between the originally predicted clusters and the perturbed, which support the clustering structure robustness to random noises.</p>
      <p id="d2e839">Cluster-level stability was quantified using a cluster retention score, defined as the average probability that members of an original cluster remain grouped together across perturbation runs also applying gaussian noises references (5 %, 10 %, 20 %) to the standardized feature matrix and re-running the clustering algorithm multiple times (200 runs). This metric allows identification of highly stable regimes as well as potentially transitional or mixed clusters. With most of the cluster retention scores above 0.95 (Table S4), results show that the obtained cluster regimes are highly stable. The exception is cluster 3, which presented a retention score of 0.88, which can be considered stable but somewhat overlapping. Finally, a consensus (co-assignment) matrix was constructed by computing, for every pair of samples, the proportion of runs in which the two samples were assigned to the same cluster. From this matrix, mean intra-cluster and inter-cluster co-assignment probabilities were derived to quantify internal cohesion and external separation (Table S5 in the supplement). The results of high intra-cluster probability (<inline-formula><mml:math id="M42" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0.85</mml:mn></mml:mrow></mml:math></inline-formula>) and low inter-cluster probability (<inline-formula><mml:math id="M43" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0.10</mml:mn></mml:mrow></mml:math></inline-formula>) show that in general members of the same cluster are consistently grouped together, which corroborates the quality of the clustering results. This test was also conducted by adding gaussian noises considering different uncertainty estimates (5 %, 10 %, 20 %).</p>
      <p id="d2e862">Together, these diagnostics provide a comprehensive evaluation of clustering stability, reproducibility, and structural robustness.</p>
</sec>
<sec id="Ch1.S2.SS5">
  <label>2.5</label><title>Optical models spatial prescription: random forest technique</title>
      <p id="d2e874">Once the optimal number of clusters is defined, which corresponds to the expected number of major optical properties regimes to influence the study region, and the clustering process is performed, each cluster is characterized by a set of AERONET instantaneous retrievals of optical and microphysical properties that are expected to express an optical property regime. Also, each AERONET instantaneous retrieval is tagged with the cluster number that it belongs to. By averaging the instantaneous properties of each cluster, we set the reference values that represent the mentioned major aerosol optical properties regimes.</p>
      <p id="d2e877">We propose a machine-learning approach that utilizes the well-known random forests supervised algorithm (Breiman, 2001) to spatially represent the aerosol optical models defined by the cluster analysis for each AERONET site (described in Sect. 2.4). The implemented method was tested using exclusively aerosol column mass density fields from MERRA-2 (Table 2) to establish the spatial distribution of the optical regime defined by the cluster's average. This approach is also suitable for chemistry transport models.</p>

<table-wrap id="T2" specific-use="star"><label>Table 2</label><caption><p id="d2e883">Predictor variables from Merra-2 (aerosol-type column mass density) used in the machine learning process to prescribe the aerosol optical regime (optical model).</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="4">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="center"/>
     <oasis:colspec colnum="4" colname="col4" align="center"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Variables</oasis:entry>
         <oasis:entry colname="col2">Abbreviation</oasis:entry>
         <oasis:entry colname="col3">Unity</oasis:entry>
         <oasis:entry colname="col4">Spatial</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4">resolution</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Dust column mass density</oasis:entry>
         <oasis:entry colname="col2">DUCMASS</oasis:entry>
         <oasis:entry colname="col3">kg m<sup>−2</sup></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M45" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.5</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.625</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Black carbon column mass density</oasis:entry>
         <oasis:entry colname="col2">BCCMASS</oasis:entry>
         <oasis:entry colname="col3">kg m<sup>−2</sup></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M47" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.5</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.625</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Organic carbon column mass density</oasis:entry>
         <oasis:entry colname="col2">OCCMASS</oasis:entry>
         <oasis:entry colname="col3">kg m<sup>−2</sup></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M49" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.5</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.625</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SO<sub>2</sub> column mass density</oasis:entry>
         <oasis:entry colname="col2">SO2CMASS</oasis:entry>
         <oasis:entry colname="col3">kg m<sup>−2</sup></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M52" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.5</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.625</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SO<sub>4</sub> column mass density</oasis:entry>
         <oasis:entry colname="col2">SO4CMASS</oasis:entry>
         <oasis:entry colname="col3">kg m<sup>−2</sup></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M55" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.5</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.625</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Sea salt column mass density</oasis:entry>
         <oasis:entry colname="col2">SSCMASS</oasis:entry>
         <oasis:entry colname="col3">kg m<sup>−2</sup></oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M57" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.5</mml:mn><mml:mi mathvariant="italic">°</mml:mi><mml:mo>×</mml:mo><mml:mn mathvariant="normal">0.625</mml:mn><mml:mi mathvariant="italic">°</mml:mi></mml:mrow></mml:math></inline-formula></oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e1193">MERRA-2 time series of column mass density for each aerosol type (DT, BC, OC, SS, SF) over each AERONET site were collocated with the network inversion products used to derive the clusters representing the distinct aerosol regimes over the Iberian Peninsula (described in Sect. 2.4). Only MERRA-2 column mass density fields were used in the Random Forest training process; optical properties fields from the reanalysis system were not used at this stage. Merra-2 column mass densities are available with a frequency of 1 h, while AERONET optical properties instantaneous retrievals are provided at irregular times, due to its dependence on cloud cover and AOD criteria (AOD at 440 nm <inline-formula><mml:math id="M58" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> 0.4). So, for each AERONET retrieval, our script searches for the MERRA-2 closest hour to synchronize the two datasets. Therefore, the collocation between AERONET retrievals and MERRA-2, for a spatial matching we considered the nearest neighbor by taking the MERRA-2 grid cell that contains the AERONET station location, and for temporal collocation MERRA-2 hourly aerosol diagnostics were matched to the closest AERONET observation time. Each AERONET instantaneous aerosol microphysical and optical properties inversion retrieval (Sinyuk et al., 2020) was connected to the corresponding cluster to which it belongs. Likewise, as mentioned, each instantaneous aerosol microphysical and optical properties inversion retrieval was also connected to the closest in-time combination of MERRA-2 data of aerosol-type column mass density (DT, BC, OC, SS, SF). With this, we built a time series of 4309 points of spatial and temporal collocated MERRA-2 aerosol types of column mass density with the developed clusters occurrences over each AERONET site, which was used in a training process aiming to predict the suitable cluster given a specific combination of aerosol types column mass density predicted by MERRA-2. This time series was randomly divided into training and testing subsets, with 70 % (3016 collocated combinations) of the data used for model training and 30 % (1293 collocated combinations) reserved for independent evaluation. This was done using the train_test_split utility from the Scikit-learn library (Abraham et al., 2014).</p>
      <p id="d2e1203">The algorithm uses training data to learn the relationship between the combination of aerosol-types' columnar mass density and the target, which are the previously developed clusters from AERONET aerosol-intensive properties. The training was done using the Random Forest Classification algorithm (RandomForestClassifier) from Scikit-Learn.</p>
      <p id="d2e1206">We used stratified <inline-formula><mml:math id="M59" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-fold cross-validation integrated within a RandomizedSearchCV hyperparameter optimization process as a strategy. Our hyperparameter optimization was performed using RandomizedSearchCV with five-fold cross-validation. The search space included the number of trees (n_estimators) sampled uniformly between 50 and 500 and the maximum tree depth (max_depth) sampled between 1 and 20. A total of five random hyperparameter combinations were evaluated, and the best-performing model was refitted on the full training dataset. The random search methodology was used to find parameter combinations inside the parameter space without the processing demands of grid search and with the stratified <inline-formula><mml:math id="M60" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-fold cross-validation we search to ensure that each fold has approximately the same class proportions as the full dataset, which allows a fair evaluation, since every validation set includes samples from all classes. This also contributes to the meaning of the performance metrics in relation to the minority classes, for example strong absorbing aerosol regimes. The stratified <inline-formula><mml:math id="M61" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-fold also favours a more stable training, given that in every training split the less frequent aerosol property regimes are also seen, which helps to reduce variance in model performance across folds. This strategy contributes to improving the hyperparameter tuning, once the RandomizedSearchCV won't select parameters based on misleading folds. So, by preserving class distribution in every fold and preventing biased results, the strategy based on stratified <inline-formula><mml:math id="M62" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-fold cross-validation helps to handle class imbalance, which in turn improves the model reliability and generalization. Class imbalance is typical in atmospheric aerosol characterization, where extreme but radiatively important aerosol regimes, like intense smoke episodes, are rare compared to more common background conditions. Therefore, with the strategy described, we also aimed to address the issues of class imbalance of aerosol regime classification in our study.</p>
      <p id="d2e1237">Cross-validated performance indicators were used to select the final configuration in order to reduce overfitting and ensure consistent performance across aerosol regimes. To evaluate model performance across aerosol regimes, and not to rely only on the overall accuracy, the performance metrics were computed individually for each regime</p>
      <p id="d2e1240">The confusion matrix utility from the Scikit-learn library (confusion_matrix) was used to visualize the performance of the models by comparing true labels with predicted labels. It allowed us to evaluate performance for each class individually and to support the interpretation of the per-class metrics calculated, namely Accuracy, Precision and Recall, and <inline-formula><mml:math id="M63" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> score. While the confusion matrix provides the context that explains the model performance, the per-class metrics provide numerical performance values for each class.</p>
      <p id="d2e1254">Accuracy represents the number of correctly classified data instances over the total; it checks the predictions against the actual values in the test set and returns the percentage of times the model got right. Precision and recall are two critical metrics for evaluating the performance of a classification model. Precision is the proportion of true positives among all the predicted positive cases (true and false), meaning it measures the accuracy of positive predictions (Eq. 2). Recall is the proportion of true positives among all actual positive cases (true and false), meaning it measures the model's ability to identify positive cases (Eq. 3). The <inline-formula><mml:math id="M64" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> score, the harmonic mean of a model's precision and recall, takes both precision and recall and provides a more balanced measure of a model's performance (Eq. 4). The <inline-formula><mml:math id="M65" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> score is set to be a value between 0 and 1, indicating, respectively, poor precision and recall and high precision and recall, which is ideal. 

                <disp-formula specific-use="align" content-type="numbered"><mml:math id="M66" display="block"><mml:mtable displaystyle="true"><mml:mlabeledtr id="Ch1.E2"><mml:mtd><mml:mtext>2</mml:mtext></mml:mtd><mml:mtd><mml:mstyle class="stylechange" displaystyle="true"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:mi mathvariant="normal">Precision</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mi mathvariant="normal">True</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi mathvariant="normal">positive</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi mathvariant="normal">True</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="normal">positive</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">False</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="normal">positive</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mtd></mml:mlabeledtr><mml:mlabeledtr id="Ch1.E3"><mml:mtd><mml:mtext>3</mml:mtext></mml:mtd><mml:mtd><mml:mstyle displaystyle="true" class="stylechange"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:mi mathvariant="normal">Recall</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mi mathvariant="normal">True</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="normal">positive</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi mathvariant="normal">True</mml:mi><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi mathvariant="normal">positive</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">False</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi mathvariant="normal">negative</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mtd></mml:mlabeledtr><mml:mlabeledtr id="Ch1.E4"><mml:mtd><mml:mtext>4</mml:mtext></mml:mtd><mml:mtd><mml:mstyle displaystyle="true" class="stylechange"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle displaystyle="true" class="stylechange"/><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>×</mml:mo><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Precision</mml:mi><mml:mo>×</mml:mo><mml:mi mathvariant="normal">Recall</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Recall</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">Precision</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mtd></mml:mlabeledtr></mml:mtable></mml:math></disp-formula></p>
      <p id="d2e1408">To identify which aerosol types most influence aerosol regime prescription and to understand whether meaningful types are driving predictions, we used the best_rfc.feature_importances_, an utility in scikit-learn's RandomForestClassifier, to calculate the scores indicating the importance of each aerosol types in the training dataset. The importance of an aerosol type in making predictions was based on how much it reduces impurity across all trees. Each decision tree in the forest splits data using different features, and each split reduces impurity. The reduction in impurity is attributed to the feature used at that split. An aerosol type importance is based on the frequency that it is used to split nodes.</p>
</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Results</title>
      <p id="d2e1420">The results section is divided into three subsections. The first one presents the results of identifying the typical aerosol optical regimes affecting the Iberian Peninsula using cluster analysis. The second subsection discusses the results and the performance of spatial prescription of these typical aerosol regimes by applying machine learning (Random Forest) to the columnar density of MERRA-2 aerosol components. Finally, case studies applying the method developed are presented and discussed.</p>
<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Cluster analysis: optical models development</title>
      <p id="d2e1430">The number of clusters (<inline-formula><mml:math id="M67" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>) selected to characterize the typical optical aerosol regimes over the Iberian Peninsula was defined based on the Elbow method (Fig. 2), which indicated five clusters were the optimal number to capture the aerosol regime variability. We also evaluated from the Elbow method that there is a sharp bending at <inline-formula><mml:math id="M68" display="inline"><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula>, which we associated with a clustering separation between aerosol regimes strongly dominated by coarse mode, dust regimes, and regimes dominated by fine mode, non-dust regimes. However, to cover more specific regimes within these two macro-regimes (dust regimes vs. non-dust regimes), a higher <inline-formula><mml:math id="M69" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula> is required, and <inline-formula><mml:math id="M70" display="inline"><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> is revealed to be the second sharpest bending. Cluster stability as a function of the number of clusters was also evaluated as a way of evaluating whether the clusters obtained are meaningful and not just artifacts of randomness or noise. High stability suggests clusters represent real structure in the data, not just random fluctuations. The stability for <inline-formula><mml:math id="M71" display="inline"><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> is above the 90 % threshold, similar to <inline-formula><mml:math id="M72" display="inline"><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:math></inline-formula>, a number after which stability sharply decreases. Therefore, combining the Elbow method and stability reinforced <inline-formula><mml:math id="M73" display="inline"><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> as an optimal cluster number to capture the typical aerosol scenarios over the Iberian Peninsula, reducing the subjectivity usually associated with the <inline-formula><mml:math id="M74" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-means clustering method.</p>

      <fig id="F2"><label>Figure 2</label><caption><p id="d2e1517">Average of sum of squares within-cluster and cluster stability as function of the number of clusters.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f02.png"/>

        </fig>

      <p id="d2e1526">We applied the cluster analysis once we defined the optimal number of clusters. As described, the result for clustering process robustness was assessed using the fraction of points changing cluster membership relative to the original classification by perturbing the input data by <inline-formula><mml:math id="M75" display="inline"><mml:mrow><mml:mo>±</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> SD (standard deviation) and rerun the <inline-formula><mml:math id="M76" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-means clustering. The fraction of points changing cluster assignment was 15.3 % for the <inline-formula><mml:math id="M77" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> SD perturbation and 17.6 % for the <inline-formula><mml:math id="M78" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> SD perturbation, yielding a mean sensitivity of 16.5 %. Only 0.5 % of points changed cluster membership under both perturbations, indicating that the observed sensitivity is largely confined to boundary points, while the cluster cores remain robust.</p>
      <p id="d2e1567">Figure 3 presents a combination of graphics used for aerosol properties analysis, highlighting the obtained clusters' behavior and distinction. The first graphic (Fig. 3a) represents the Aerosol Optical Depth (AOD) as a function of Angstrom Exponent (AE), which allows us to relate aerosol loading variability with aerosol regimes dominated either by coarse or fine mode (Eck et al., 1999). This analysis shows that two of the clusters (C0 and C1) are regimes dominated by coarse mode particles (AE <inline-formula><mml:math id="M79" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 1.0), while the remaining three (C2, C3, and C4) are regimes under the stronger influence of fine mode particles (AE <inline-formula><mml:math id="M80" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> 1.0). The second plot displays the asymmetric parameter against the single scattering albedo at 440 nm. This plot aims to elucidate the clusters' distinctions related to particle absorption efficiency and the asymmetry between hemispherical forward and backward scattering. Aerosol regimes dominated by coarse particles tend to exhibit more significant forward scattering and, consequently, higher asymmetry parameter values. In contrast, lower asymmetry parameter values are expected in fine mode regimes (Eck et al., 1999; Dubovik et al., 2002). This pattern is evident in the graphic; clusters C0 and C1 present higher asymmetry parameter values. It is also possible to identify the distinction between the non-dust regimes C2, C3, and C4. C2 presents the lowest asymmetry parameter values, while it is the most absorbing of the clusters, according to its single scattering albedo values. Small and highly absorbing particles are commonly associated with urban pollution or fresh smoke plumes from biomass burning (Dubovik et al., 2002; Omar et al., 2005; Levy et al., 2010; Martins et al., 2009). The C3 cluster differs significantly from C2 by presenting higher asymmetry parameter values, an indication of a shift to larger particle sizes. C3 has higher single-scattering albedo values, indicating a less absorbing aerosol regime. SSA alone did not help to differentiate the two clusters dominated by coarse mode particles (C0 and C1). C0 asymmetry parameter values tend to be lower than those of C1, suggesting that the former could be a dusty mixture not as close to a pure dust scenario as C1. The traditional plot of Lidar Ratio (LR) against Linear Depolarization Ratio (LDR) (Kanitz et al., 2013; Illingworth et al., 2015) confirms this hypothesis (Fig. 3d). Pure dust regimes of aerosol, due to their high level of non-spherical particles, produce higher LDR (Groß et al., 2011). The C1 cluster presents higher values of LDR than C0, indicating that C1 is closer to a pure dust regime. The C0, while a dust regime, is likely to represent a mixed scenario given its LDR values consistent with dust and smoke mixing (Kanitz et al., 2013). LDR values below 15 %, which is the case of the clusters C2, C3, and C4, are typically associated with fresh/aged smoke, urban-industrial pollution, and marine particles scenarios. The analysis of the real part versus the imaginary part of the complex refractive index (Fig. 3c) emphasizes C2 as the aerosol regime with the largest absorption and highlights that the real part of the complex refractive index is the main aspect differentiating C3 and C4.</p>

      <fig id="F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e1586">Scatterplot of the clusters elements  as function of different parameters: <bold>(a)</bold> extinction Angstrom Exponent (AE) as function of Aerosol Optical Depth (AOD) at 440 nm; <bold>(b)</bold> Asymmetry Parameter (ASY) as function of Single Scattering Albedo (SSA) at 440 nm; <bold>(c)</bold> Lidar Ratio as a function of Linear Depolarization Ratio at 1020 nm; <bold>(d)</bold> refractive index at 440 nm: imaginary part as function of Real part.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f03.png"/>

        </fig>

      <p id="d2e1607">Figures 4 and 5 present the clusters averages for selected features: size distribution, complex refractive index, single scattering albedo, and asymmetry parameter. A more detailed summary of the mean behavior of the clusters is presented in Table 3. The average size distribution of the clusters confirms that aerosol regimes affecting the Iberian Peninsula vary between two scenarios dominated by coarse mode (C0, C1), named here as dust regimes, and three scenarios when coarse mode is not dominant, here considered as non-dust regimes. There are differences between the dust regimes: C1 is associated with a higher coarse particle loading than C0. Among the non-dust regimes (C2, C3, and C4), the main difference is seen between C2 and the other two. C2 is characterized by a larger fine particle loading. Between C3 and C4, one can observe a larger radius spread for C3 regarding the contribution of the fine mode, which indicates a potential growth of particles via processes such as water uptake, aging, and coagulation, or that the aerosol regime mixture includes sources that naturally produce slightly larger fine particles. These features usually indicate more aged, more hygroscopic, or more humidified aerosol compared to freshly emitted, dry fine particles.</p>

      <fig id="F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e1612">Clusters mean volume particle size distribution as a function of radius. These size distributions correspond to the average of the instantaneous size distributions retrieved by AERONET from each identified cluster. The numeric values of each cluster size distribution can be found in Table S2.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f04.png"/>

        </fig>

      <fig id="F5" specific-use="star"><label>Figure 5</label><caption><p id="d2e1624">Clusters average of complex refractive index, <bold>(a)</bold> real and <bold>(b)</bold> imaginary parts, <bold>(c)</bold> single scattering albedo and <bold>(d)</bold> asymmetry parameter.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f05.png"/>

        </fig>

<table-wrap id="T3" specific-use="star"><label>Table 3</label><caption><p id="d2e1648">Summary of the clusters based on the average of optical and microphysical properties. A detailed description of the clusters can be found in Tables S1 and S2. The values in the brackets correspond to standard deviation.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="6">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Properties</oasis:entry>
         <oasis:entry colname="col2">Cluster0</oasis:entry>
         <oasis:entry colname="col3">Cluster1</oasis:entry>
         <oasis:entry colname="col4">Cluster2</oasis:entry>
         <oasis:entry colname="col5">Cluster3</oasis:entry>
         <oasis:entry colname="col6">Cluster4</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">(polluted</oasis:entry>
         <oasis:entry colname="col3">(pure</oasis:entry>
         <oasis:entry colname="col4">(strongly</oasis:entry>
         <oasis:entry colname="col5">(Urban-</oasis:entry>
         <oasis:entry colname="col6">(moderately</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">dust)</oasis:entry>
         <oasis:entry colname="col3">dust)</oasis:entry>
         <oasis:entry colname="col4">absorbing</oasis:entry>
         <oasis:entry colname="col5">industrial</oasis:entry>
         <oasis:entry colname="col6">absorbing</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4">smoke)</oasis:entry>
         <oasis:entry colname="col5">pollution)</oasis:entry>
         <oasis:entry colname="col6">smoke)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Number of records</oasis:entry>
         <oasis:entry colname="col2">1308</oasis:entry>
         <oasis:entry colname="col3">1665</oasis:entry>
         <oasis:entry colname="col4">153</oasis:entry>
         <oasis:entry colname="col5">660</oasis:entry>
         <oasis:entry colname="col6">609</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Percentage (%)</oasis:entry>
         <oasis:entry colname="col2">29.76</oasis:entry>
         <oasis:entry colname="col3">37.88</oasis:entry>
         <oasis:entry colname="col4">3.48</oasis:entry>
         <oasis:entry colname="col5">15.01</oasis:entry>
         <oasis:entry colname="col6">13.74</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Ref_Idx_Real (440 nm)</oasis:entry>
         <oasis:entry colname="col2">1.47 (0.04)</oasis:entry>
         <oasis:entry colname="col3">1.44 (0.03)</oasis:entry>
         <oasis:entry colname="col4">1.51 (0.07)</oasis:entry>
         <oasis:entry colname="col5">1.43 (0.06)</oasis:entry>
         <oasis:entry colname="col6">1.52 (0.05)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Ref_Idx_Img (440 nm)</oasis:entry>
         <oasis:entry colname="col2">0.005 (0.002)</oasis:entry>
         <oasis:entry colname="col3">0.004 (0.001)</oasis:entry>
         <oasis:entry colname="col4">0.025 (0.009)</oasis:entry>
         <oasis:entry colname="col5">0.006 (0.004)</oasis:entry>
         <oasis:entry colname="col6">0.009 (0.004)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">VMR-F</oasis:entry>
         <oasis:entry colname="col2">0.14 (0.03)</oasis:entry>
         <oasis:entry colname="col3">0.14 (0.03)</oasis:entry>
         <oasis:entry colname="col4">0.16 (0.02)</oasis:entry>
         <oasis:entry colname="col5">0.21 (0.04)</oasis:entry>
         <oasis:entry colname="col6">0.18 (0.04)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">STD-F</oasis:entry>
         <oasis:entry colname="col2">0.61 (0.09)</oasis:entry>
         <oasis:entry colname="col3">0.67 (0.07)</oasis:entry>
         <oasis:entry colname="col4">0.42 (0.06)</oasis:entry>
         <oasis:entry colname="col5">0.47 (0.06)</oasis:entry>
         <oasis:entry colname="col6">0.41 (0.05)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">REff-F</oasis:entry>
         <oasis:entry colname="col2">0.12 (0.02)</oasis:entry>
         <oasis:entry colname="col3">0.12 (0.02)</oasis:entry>
         <oasis:entry colname="col4">0.14 (0.02)</oasis:entry>
         <oasis:entry colname="col5">0.18 (0.03)</oasis:entry>
         <oasis:entry colname="col6">0.17 (0.03)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">REff-C</oasis:entry>
         <oasis:entry colname="col2">1.68 (0.16)</oasis:entry>
         <oasis:entry colname="col3">1.61 (0.13)</oasis:entry>
         <oasis:entry colname="col4">2.44 (0.43)</oasis:entry>
         <oasis:entry colname="col5">2.31 (0.38)</oasis:entry>
         <oasis:entry colname="col6">2.25 (0.49)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">VMR-C</oasis:entry>
         <oasis:entry colname="col2">2.02 (0.23)</oasis:entry>
         <oasis:entry colname="col3">1.88 (0.17)</oasis:entry>
         <oasis:entry colname="col4">3.10 (0.45)</oasis:entry>
         <oasis:entry colname="col5">2.82 (0.42)</oasis:entry>
         <oasis:entry colname="col6">2.82 (0.57)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">STD-C</oasis:entry>
         <oasis:entry colname="col2">0.60 (0.52)</oasis:entry>
         <oasis:entry colname="col3">0.54 (0.04)</oasis:entry>
         <oasis:entry colname="col4">0.68 (0.06)</oasis:entry>
         <oasis:entry colname="col5">0.63 (0.05)</oasis:entry>
         <oasis:entry colname="col6">0.67 (0.05)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">AOD (440 nm)</oasis:entry>
         <oasis:entry colname="col2">0.50 (0.11)</oasis:entry>
         <oasis:entry colname="col3">0.58 (0.21)</oasis:entry>
         <oasis:entry colname="col4">0.64 (0.29)</oasis:entry>
         <oasis:entry colname="col5">0.48 (0.09)</oasis:entry>
         <oasis:entry colname="col6">0.51 (0.13)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">SSA (440 nm)</oasis:entry>
         <oasis:entry colname="col2">0.91 (0.03)</oasis:entry>
         <oasis:entry colname="col3">0.91 (0.02)</oasis:entry>
         <oasis:entry colname="col4">0.86 (0.03)</oasis:entry>
         <oasis:entry colname="col5">0.95 (0.03)</oasis:entry>
         <oasis:entry colname="col6">0.94 (0.03)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">ASY (440 nm)</oasis:entry>
         <oasis:entry colname="col2">0.76 (0.02)</oasis:entry>
         <oasis:entry colname="col3">0.79 (0.19)</oasis:entry>
         <oasis:entry colname="col4">0.67 (0.03)</oasis:entry>
         <oasis:entry colname="col5">0.73 (0.03)</oasis:entry>
         <oasis:entry colname="col6">0.69 (0.02)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">AE (440/870 nm)</oasis:entry>
         <oasis:entry colname="col2">0.40 (0.25)</oasis:entry>
         <oasis:entry colname="col3">0.24 (0.14)</oasis:entry>
         <oasis:entry colname="col4">1.67 (0.20)</oasis:entry>
         <oasis:entry colname="col5">1.43 (0.26)</oasis:entry>
         <oasis:entry colname="col6">1.47 (0.25)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">LR (1020 nm)</oasis:entry>
         <oasis:entry colname="col2">64 (9)</oasis:entry>
         <oasis:entry colname="col3">70 (8)</oasis:entry>
         <oasis:entry colname="col4">89 (16)</oasis:entry>
         <oasis:entry colname="col5">77 (17)</oasis:entry>
         <oasis:entry colname="col6">61 (15)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">LDPR (440 nm)</oasis:entry>
         <oasis:entry colname="col2">0.17 (0.04)</oasis:entry>
         <oasis:entry colname="col3">0.21 (0.04)</oasis:entry>
         <oasis:entry colname="col4">0.01 (0.03)</oasis:entry>
         <oasis:entry colname="col5">0.03 (0.04)</oasis:entry>
         <oasis:entry colname="col6">0.03 (0.05)</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e2112">Clusters C2 and C4 have close values for the real part of the refractive index, but cluster C2 has a much larger imaginary part, justifying its lowest SSA (Fig. 5). The C2 strong absorption combined with its smaller particles suggests that it is likely associated with fresh smoke (Reid and Hobbs, 1998; Reid et al., 2005). The average of the real part of the complex refractive index corroborates the difference between the C3 and C4 aerosol regimes. According to Moise et al. (2015), a variation as such observed between C3 and C4 (1.4 to 1.5) could produce an increment of 12 % in estimating the direct aerosol radiative forcing over the solar spectrum wavelength range. Zhao et al. (2019) also showed that the direct aerosol radiative forcing is estimated to vary by 40 % when the real part of the complex index values varies between 1.36 and 1.56. The reasons for the differences observed between the real parts of C3 and C4 remain unclear. However, the spatial distribution of the clusters (see Fig. 6) indicates that C3 is more prevalent in the eastern region of the Iberian Peninsula, which is the wettest area and more exposed to air masses from the Mediterranean and Eastern Europe. Additionally, the low values of the real part of the complex refractive index for C3 align with aerosol regimes that have a strong contribution from sulfate particles. The spectral dependency of the single scattering albedo corroborates our attribution of the C0 and C1 to a dust regime. Dust particles are characterized by strong absorption in the UV spectrum (Dubovik et al., 2002), which decreases as the wavelength increases, a feature present in both C0 and C1. Also, consistent with dust-dominated regimes, C0 and C1 have the largest mean asymmetry parameters at all wavelengths.</p>

      <fig id="F6"><label>Figure 6</label><caption><p id="d2e2117">Proportions of the occurrence of the clusters of aerosol regimes at the AERONET sites across the Iberian Peninsula.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f06.png"/>

        </fig>

      <fig id="F7" specific-use="star"><label>Figure 7</label><caption><p id="d2e2129">Clusters relative monthly occurrence over the AERONET sites representatives of the Iberian Peninsula western lowlands (Evora), highlands plateau (Madrid) and southeast lowlands (El Arenosillo, Granada).</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f07.png"/>

        </fig>

      <p id="d2e2138">The analysis above and the summary provided by Table 3 provide several specific characteristics that help us to contextualize the clusters. To enhance this understanding, we add the spatial (Fig. 6) and seasonal (Fig. 7) distribution of the clusters into our analysis. C0 and C1 aerosol regimes are dominated by dust, where C1 is the closest regime to what we could call a pure dust scenario. Both aerosol regimes, C0 and C1, affect practically the entire Peninsula (Fig. 6) and all year round, but it is more frequent in the southern part of the Peninsula, an expected feature considering that the dust particles are mainly transported from North Africa (Cachorro et al., 2016; Gómez-Amo et al., 2017). The C2 cluster is the most absorbing regime and is characterized by the smallest fine mode particles (Table 3). Its spatial distribution (Fig. 6), with more frequent occurrence along the belt spanning from Evora, in Portugal, to Caceres, in Spain, a region known for high recurrence of biomass burning, reinforces our hypothesis. Additionally, the seasonal distribution of C2 in this region coincides with the peak of the biomass burning season. The C3 aerosol regime also occurs over all AERONET sites throughout the year, but it is dominant in the eastern and northeastern portions of the Iberian Peninsula. Among non-dust regimes, its unique feature is its very low real part of the refractive index. C4, as C3, is weakly absorbing according to its single scattering albedo. C4 is present across the entire Peninsula, but its occurrence increases in the central and northern portions, which are more prone to biomass burning. An important feature of C4 is that its occurrence increases during the summer and the beginning of autumn (Fig. 7) in the central region of the Iberian Peninsula, from Évora (Portugal) to Madrid (Spain), when the region's biomass burning season is underway. These aspects led us to hypothesize that C4 is an aerosol regime under the strong influence of smoke aerosol particles.</p>
      <p id="d2e2141">Figures 7 and 8 provide a perspective view on the seasonal occurrence of each cluster based on sites that represent different regions of the Iberian Peninsula.</p>

      <fig id="F8" specific-use="star"><label>Figure 8</label><caption><p id="d2e2146">Clusters relative monthly occurrence over the AERONET sites representatives of the following Iberian Peninsula regions: Eastern Coast (Barcelona, Burjassot) and Northern (Coruna, CENER).</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f08.png"/>

        </fig>

</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Random Forest classifier: performance and optical models spatial dynamic</title>
      <p id="d2e2163">The Random Forest training of MERRA-2 aerosol-type column mass density as predictors of aerosol optical regime covered 70 % of the AERONET sky inversions used in this study, combining datasets from all sites. The testing dataset, constituted by the remaining 30 %, was used to evaluate the model's performance. The best parameters obtained from the optimization using RandomizedSearchCV were the number of decision trees of 477 (n_estimators <inline-formula><mml:math id="M81" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 477) and the maximum depth of trees of 19 (max_depth <inline-formula><mml:math id="M82" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 19). There are several metrics for assessing machine learning performance. Figure 9 presents the one used in this study, the Normalized Confusion Matrix (NCM), which expresses the percentage of correct and incorrect predictions (where the classifier got confused). In the matrix, the rows represent the true labels, and the columns represent the predicted ones. The values along the diagonal indicate the percentage of times where the predicted matches the true label. The other cells reflect instances where the classifier mislabeled an observation; the column tells us what the classifier predicted, and the row tells us the correct label.</p>

      <fig id="F9" specific-use="star"><label>Figure 9</label><caption><p id="d2e2182">Normalized confusion matrix of the Random Forest classifier applied to the prediction of the clusters that describe the typical aerosol optical regime based on MERRA-2 aerosol components column mass density.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f09.png"/>

        </fig>

      <p id="d2e2191">For all clusters, the classifier's correct predictions surpassed the incorrect predictions, with a maximum frequency of correct predictions close to 80 % obtained for C1. The minimum percentage of correct prediction, about 60 %, was obtained for C2, the highest absorbing cluster. Regarding dust regime clusters, despite the struggle to predict C0, it is possible to see that, in this case, the classifier's main confusion is with the C1, which is also a cluster related to an aerosol scenario dominated by coarse mode particles (dust regime), as with C0. The classifier's confusion in this case is between the two dust-regime models; therefore, the induced error in optical properties prescription would be lower than that if the confusion was between a dust and a non-dust regime, especially like C2, which is substantially different from any of the dust regimes. Rarely does the classifier take either C0 or C1 as C2, C3, and C4, a case where substantial error in the optical properties prescription would be expected. By combining C0 and C1 results in the NCM, the percentage of correct predictions achieved by the classifier indicating dust regime is higher than 95 %. Similarly, the classifier rarely takes C3 and C4 as C0, C1, and C2. Given that C3 and C4 are also close in terms of their optical properties, especially concerning absorption, some degree of confusion among them is expected. Nevertheless, these aspects of the confusion matrix among close clusters are important to identify where the model needs extra training, for instance, considering longer time series when available and adding new and relevant predictors, such as Brown Carbon, an important aerosol component not available in the current MERRA-2 aerosol reanalysis products. C2, the least frequent and the one representing the most absorbing aerosol regime over the Iberian Peninsula, is rarely mislabeled as C0 or C1, but often mislabeled as C3 or C4. Still, the score percentage is around 60 %.</p>

      <fig id="F10" specific-use="star"><label>Figure 10</label><caption><p id="d2e2198">Relative importance of the predictor variables, i.e. the degree of influence of each aerosol-type column mass density on the model decision-making. dst – Dust, oac – Organic Carbon, ssl – Sea-Salt, SO<sub>2</sub> – Sulfate SO<sub>2</sub> – Sulfur dioxide (precursor of SO<sub>4</sub>), bcc – Black Carbon.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f10.png"/>

        </fig>

      <p id="d2e2234">To provide further insight into the model performance, we also examined other metrics commonly used to evaluate Random Forest training. Precision, Recall, and <inline-formula><mml:math id="M86" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> score were calculated for both scenarios, the trained model applied to the test and to the train dataset (Table 4). The results indicate that the model generalizes well, without significant overfitting. Even for Cluster 2, which has a small number of occurrences, the model was able to maintain high precision and score. The general accuracy did not drop critically for the test data (0.70) when compared with the train dataset (0.88), another indicator of the model's ability to generalize. The trained model applied to the test dataset achieved a general accuracy of 70 %, meaning it correctly predicted the aerosol regime in three out of four cases. For all clusters, all metrics adopted were higher than 0.60, with precision and recall values exceeding 0.75 in some cases. The precision metric indicates how often the positive predictions are correct. The model precision varied within the specific optical regimes (ex., non-dust) and among optical regimes (dust, non-dust). It showed higher precision in identifying C1 than C0, the two dust regimes. Among the non-dust regime clusters, the lowest precision obtained was 0.62 for the prediction of C2; nevertheless, this precision is still a promising outcome considering the limited number of samples of this cluster available for the training process. Given its strong absorption nature, mislabeling the C2 aerosol regime would translate into high error in optical properties prescription; therefore, as mentioned, extra training is required to improve the model prediction for C2 occurrence.</p>

<table-wrap id="T4"><label>Table 4</label><caption><p id="d2e2251">Performance metrics values of the trained model applied to the test and the train (within parenthesis) dataset to predict aerosol optical regimes based on aerosol-type column mass density.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="center"/>
     <oasis:colspec colnum="3" colname="col3" align="center"/>
     <oasis:colspec colnum="4" colname="col4" align="center"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Clusters</oasis:entry>
         <oasis:entry colname="col2">Precision</oasis:entry>
         <oasis:entry colname="col3">Recall</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M87" display="inline"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>-score</oasis:entry>
         <oasis:entry colname="col5">Support (<inline-formula><mml:math id="M88" display="inline"><mml:mi>N</mml:mi></mml:math></inline-formula>)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">0</oasis:entry>
         <oasis:entry colname="col2">0.62 (0.89)</oasis:entry>
         <oasis:entry colname="col3">0.62 (0.78)</oasis:entry>
         <oasis:entry colname="col4">0.62 (0.83)</oasis:entry>
         <oasis:entry colname="col5">361 (909)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">1</oasis:entry>
         <oasis:entry colname="col2">0.68 (0.86)</oasis:entry>
         <oasis:entry colname="col3">0.70 (0.94)</oasis:entry>
         <oasis:entry colname="col4">0.69 (0.90)</oasis:entry>
         <oasis:entry colname="col5">517 (1130)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">2</oasis:entry>
         <oasis:entry colname="col2">0.62 (0.92)</oasis:entry>
         <oasis:entry colname="col3">0.60 (0.76)</oasis:entry>
         <oasis:entry colname="col4">0.61 (0.83)</oasis:entry>
         <oasis:entry colname="col5">47 (106)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">3</oasis:entry>
         <oasis:entry colname="col2">0.76 (0.93)</oasis:entry>
         <oasis:entry colname="col3">0.73 (0.94)</oasis:entry>
         <oasis:entry colname="col4">0.74 (0.94)</oasis:entry>
         <oasis:entry colname="col5">206 (429)</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">4</oasis:entry>
         <oasis:entry colname="col2">0.68 (0.91)</oasis:entry>
         <oasis:entry colname="col3">0.69 (0.93)</oasis:entry>
         <oasis:entry colname="col4">0.69 (0.92)</oasis:entry>
         <oasis:entry colname="col5">162 (442)</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e2401">Figure 10 illustrates the relative importance of the predictor variables for the grids consisting of the AERONET sites, highlighting the influence of each aerosol-type column mass density on the model's decision-making. The results indicate that the presence of dust over the Iberian Peninsula is the primary factor affecting the aerosol optical properties in this region. This finding aligns with actual conditions, as the transport of Saharan dust to the peninsula is the main driver of aerosol optical properties variability in the area. Dust is followed by organic carbon, sea salt, and sulfate aerosol types. Organic carbon relevance is associated with biomass burning, a critical aerosol source during the dry season. Interestingly, black carbon column mass density did not rank among the top predictors. Despite the expectation that black carbon might serve as a significant indicator of the aerosol optical regime due to its association with smoke-influenced aerosols. There is considerable uncertainty in black carbon simulations in atmospheric chemistry models, including reanalyses such as MERRA-2, which may hinder its effectiveness in predicting the aerosol regime observed at AERONET monitoring sites.</p>
      <p id="d2e2404">We also managed to calculate the relative importance of the predictors from Table 1 in the cluster prediction; the result is presented in the supplement (Fig. S2). Consistency can be observed between the score scale from Fig. S2 and that derived from MERRA-2 with respect to aerosol types (Fig. 10). In Fig. 10, dust (dst) mass variability emerges as the most influential factor in determining which cluster should be applied. In the Fig. S2 figure, which presents the importance of the optical parameters from Table 1 for clustering, the scores appear well distributed, with a maximum value close to 0.1. Nevertheless, it is evident that higher wavelengths (near-infrared at 870 and 1020 nm) and specific optical parameters – namely the Asymmetry Parameter and the Linear Depolarization Ratio – exhibit the greatest importance, as they are most effective in distinguishing dust from other aerosol types.</p>
</sec>
<sec id="Ch1.S3.SS3">
  <label>3.3</label><title>Application: case studies</title>
      <p id="d2e2415">From the testing dataset, we selected some case studies that significantly impacted local populations, garnered media attention, and represented different aerosol scenarios in the Iberian Peninsula. This selection provides a visual (qualitative) demonstration of the model's predicting capability (Table 5).</p>

<table-wrap id="T5"><label>Table 5</label><caption><p id="d2e2421">List of case studies of aerosols high loading events over Iberian Peninsula selected to highlight as examples of the classifier trained model application.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="3">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Case study</oasis:entry>
         <oasis:entry colname="col2">Date</oasis:entry>
         <oasis:entry colname="col3">Nature</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">(reference</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">link)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">01</oasis:entry>
         <oasis:entry colname="col2">27 June 2023</oasis:entry>
         <oasis:entry colname="col3">Smoke<sup>1</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">02</oasis:entry>
         <oasis:entry colname="col2">16 October 2017</oasis:entry>
         <oasis:entry colname="col3">Dust and Smoke<sup>2</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">03</oasis:entry>
         <oasis:entry colname="col2">11 August 2016</oasis:entry>
         <oasis:entry colname="col3">Smoke<sup>3</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">04</oasis:entry>
         <oasis:entry colname="col2">17 March 2022</oasis:entry>
         <oasis:entry colname="col3">Dust<sup>4</sup></oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e2424"><sup>1</sup> <uri>https://earthobservatory.nasa.gov/images/151507/canadian-smoke-reaches-europe</uri> (last access: 1 April 2026); <sup>2</sup> <uri>https://atmosphere.copernicus.eu/saharan-dust-and-smoke-over-france-and-uk</uri> (last access: 1 April 2026); <sup>3</sup> <uri>https://earthobservatory.nasa.gov/images/88552/fires-rage-in-portugal</uri> (last access: 1 April 2026); <sup>4</sup> <uri>https://earthobservatory.nasa.gov/images/149645/dusty-storm-clouds-over-europe</uri> (last access: 1 April 2026).</p></table-wrap-foot></table-wrap>

      <fig id="F11" specific-use="star"><label>Figure 11</label><caption><p id="d2e2606">Case studies of distinct aerosol scenarios over the Iberian Peninsula selected to test our machine-learning based approach to predict the best optical property regime: <bold>(a, b)</bold> Case 01 on 27 June 2023; <bold>(c, d)</bold> Case 02 on 16 October 2017; <bold>(e, f)</bold> Case 03 on 11 August 2016; <bold>(g, h)</bold> Case 04 on 17 March 2022. On the left side, MODIS Terra and Aqua/NASA True color satellite images (<uri>https://wvs.earthdata.nasa.gov</uri>, last access: 1 April 2026); and on the right the cluster spatial distribution prescribed by the model.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f11.jpg"/>

        </fig>

      <p id="d2e2631">We set our trained model to prescribe the spatial distribution of aerosol optical regimes (clusters) that best fit various scenarios based on MERRA-2 aerosol-type column mass density. The results for all cases studied are presented in Fig. 11. To minimize uncertainties associated with the estimates of aerosol absorptivity, AERONET SSA retrievals are limited to cases where the AOD at 440 nm exceeds 0.4 (Dubovik and King, 2000; Holben et al., 2006). Therefore, the discussion of the optical regime prescriptions was focused on areas where AOD was above this threshold. The uncertainty in retrieved SSA is <inline-formula><mml:math id="M97" display="inline"><mml:mrow><mml:mo>∼</mml:mo><mml:mn mathvariant="normal">0.03</mml:mn></mml:mrow></mml:math></inline-formula> at AOD at 440 nm <inline-formula><mml:math id="M98" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.4 and decreases at higher AOD levels (Sinyuk et al., 2020).</p>
      <p id="d2e2651">For our regional analysis, we used the MERRA-2 AOD field as a reference, since AERONET provides local AOD at specific sites. Figure S1 in the Supplement exhibits as example the seasonal cycle aerosol AOD at 550 nm over the Iberian Peninsula. Given that the prescription is done based on a map of the combination of aerosol types column density from models, in this case MERRA-2, the only way to filter areas across the Iberian Peninsula where AOD at 440 nm <inline-formula><mml:math id="M99" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> 0.4 is to use the AOD field from MERRA-2.</p>
      <p id="d2e2661">Case 01 occurred from 1 to 25 June 2023, coinciding with large-scale wildfire events in Quebec, Canada. A substantial portion of smoke from these wildfires crossed the Atlantic Ocean and reached Western Europe, especially the Iberian Peninsula, resulting in darkened skies in the affected countries. Our trained model predicted that the most suitable aerosol optical regime for the areas impacted by the smoke (Portugal, Western, and Northern Spain) is C4, which corroborates our previous discussion associating the C4 optical regime with regional smoke.</p>
      <p id="d2e2664">Case 02 features an emblematic event on 16 October 2017, marked by a simultaneous massive wildfire in central and northern Portugal and a strong dust transport from North Africa via the south of Portugal. The path connecting the smoke and dust produced a strong northward transport affecting the United Kingdom, influenced by the synoptic conditions associated with the ex-hurricane Ophelia, located just north of the Iberian Peninsula (Osborne et al., 2019). The optical regime prescription identified the C4 cluster as the appropriate regime from central Portugal northward to the UK. Meanwhile, the area affected by dust, spanning from North Africa to southern and central Portugal, was characterized by a mix of C0 and C1, the clusters associated with dust regimes. As the dust plume arrived in Portugal, the model indicated a gradual transition from C1, indicative of pure dust, to C0, which represents conditions of dust mixed with smoke (Gómez-Amo et al., 2017). The random distribution of C2 within the larger C4 regions likely reflects the model's response to the specific conditions dictated by the aerosol-type column mass densities. This could suggest patches of high-absorbing aerosol-type within a less-absorbing large-scale smoke plume, although there is insufficient evidence to draw definitive conclusions.</p>
      <p id="d2e2667">Case 03, dated 11 August 2016, involved strong wildfire emissions in northern Portugal. Most of the smoke was transported toward the Atlantic Ocean, while the remainder of the peninsula experienced low aerosol loading conditions. Consistent with fresh smoke aerosol scenarios, the model prescribed the C2 optical regime, the highest absorbing cluster. In strong biomass burning events, especially at the early stage of the emission process, the ratio of elemental carbon to organic carbon is usually high, which has been shown to explain the high absorption features of fresh smoke plume (Schwink et al., 2024). Additionally, previous studies have also shown that Brown Carbon (BrC) absorption is strongest in fresh smoke plumes and decreases with atmospheric processing (Saleh et al., 2014; Pokhrel et al., 2017).</p>
      <p id="d2e2670">Case 04 pertains to an extreme Saharan dust transport that affected most of the Iberian Peninsula on 15–17 March 2022. During this event, the 24 h average concentration of PM2.5 reached as high as 700 <inline-formula><mml:math id="M100" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>g m<sup>−3</sup> in parts of Spain (Rodríguez and López-Darias, 2024). The pollution episode was dominated by dust, and indeed, the model prescribed the optical regimes C0 and C1, which indicate pure dust and dusty conditions for most of the Iberian Peninsula. This demonstrates our approach's capability to differentiate specific scenarios within dust regimes. For non-dust regimes such as C2, a highly absorbing regime, we would not expect to see widespread prescriptions, as we hypothesize that it is associated with fresh, high-absorbing pollution plumes.</p>

      <fig id="F12" specific-use="star"><label>Figure 12</label><caption><p id="d2e2696">Single Scattering Albedo (SSA) prescription based on the current study approach <bold>(a, c, e, g)</bold> and that simulated by MERRA-2 <bold>(b, d, f, h)</bold> for the selected case studies of Table 5: <bold>(a, b)</bold> Case 01 on 27 June 2023; <bold>(c, d)</bold> Case 02 on 16 October 2017; <bold>(e, f)</bold> Case 03 on 11 August 2016; <bold>(g, h)</bold> Case 04 on 17 March 2022.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f12.png"/>

        </fig>

      <p id="d2e2724">Figure 6, depicting the occurrence of each cluster across the Iberian Peninsula, corroborates our hypothesis by indicating that the C2 regime is mainly present in specific areas where aerosol loading increases are primarily attributed to biomass burning, such as the western lowlands of the Iberian Peninsula (Evora, Badajoz, and Caceres) and in the Galicia region (Coruna). The C3 optical regime was not linked to large-scale dust transport or smoke plumes across the Iberian Peninsula, suggesting it might be associated with high levels of local or regional pollution. Figure 6 shows that the C3 regime is commonly observed throughout the year in the eastern portion of the Iberian Peninsula. The results of these case studies, combined with performance evaluations, highlight the capability and potential of this machine-learning approach, which uses clustering and random forest classification to prescribe optical models from aerosol-type columnar mass density to calculate aerosol particles' direct radiative effect in atmospheric models. By constraining modelling with observational aerosol optical data, we can help mitigate the known uncertainties related to aerosol direct radiative forcing.</p>

      <fig id="F13" specific-use="star"><label>Figure 13</label><caption><p id="d2e2729">Current study prescription and MERRA-2 simulation of Single Scattering Albedo (SSA) frequency distribution as function of the optical regime (clusters): <bold>(a)</bold> Cluster 0; <bold>(b)</bold> Cluster 1; <bold>(c)</bold> Cluster 3; <bold>(d)</bold> Cluster 4. The dashed lines represent the mean values.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f13.png"/>

        </fig>

      <p id="d2e2750">Figure 12 shows the single scattering albedo at 550 nm, comparing the current approach and MERRA-2 reanalysis results. The MERRA-2 columnar total SSA was calculated based on the ratio of total scattering aerosol optical depth to total extinction aerosol optical depth, both provided in MERRA-2 aerosol products. For smoke scenarios on 27 June 2023, MERRA-2 indicated a more absorbing optical regime (SSA at 550 nm <inline-formula><mml:math id="M102" display="inline"><mml:mo>∼</mml:mo></mml:math></inline-formula> 0.86–0.90) compared to the current approach (SSA at 550 nm <inline-formula><mml:math id="M103" display="inline"><mml:mo>∼</mml:mo></mml:math></inline-formula> 0.95). On this day, the average SSA at 550 nm over the AERONET site in Coruna City, which was directly affected by Canadian smoke, exceeded 0.95. The opposite was observed for the strong smoke emission event that occurred over northern Portugal on 11 August 2016. Current strategy prescribed a much lower SSA, therefore the strongest absorbing regime, when compared with the MERRA-2 calculation. Due to the absence of a site in the northern part of Portugal, we were not able to compare the prescribed and simulated values with AERONET data. For the dust scenario, on 17 March 2022, the current approach prescribed a less absorbing optical regime (SSA at 550 nm <inline-formula><mml:math id="M104" display="inline"><mml:mo>∼</mml:mo></mml:math></inline-formula> 0.94–0.95) compared to MERRA-2, which reported a SSA at 550 nm of roughly 0.92–0.94. The analysis of SSA at 550 nm over AERONET sites affected by the dust event surpassed 0.94. While these cases highlight differences between the prescriptions based on the clusters and MERRA-2 results, they are only sufficient to warrant further investigation. To gain a statistical perspective on whether the findings from these case studies are isolated incidents or indicative of a trend, we compare a much larger sample of MERRA-2 SSA at 550 nm across various AERONET sites in the Iberian Peninsula using the clusters approach. We focused only on MERRA-2 aerosol scenarios for AOD at 550 nm larger than 0.3, which correspond to AOD higher than 0.4 at 440 nm previously mentioned, and conducted the comparison segmented by the optical regimes defined by the clusters.</p>

      <fig id="F14" specific-use="star"><label>Figure 14</label><caption><p id="d2e2776">Current study prescription and MERRA-2 simulation of Angstrom Exponent (AE) frequency distribution as function of the optical regime (clusters): <bold>(a)</bold> Cluster 0; <bold>(b)</bold> Cluster 1; <bold>(c)</bold> Cluster 3; <bold>(d)</bold> Cluster 4. The dashed lines represent the mean values.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f14.png"/>

        </fig>

      <fig id="F15" specific-use="star"><label>Figure 15</label><caption><p id="d2e2800">Current study prescription and MERRA-2 simulation of <bold>(a)</bold> Single Scattering Albedo and <bold>(b)</bold> Angstrom Exponent (AE) frequency distribution for the Cluster 2 scenario. The dashed lines represent the mean values.</p></caption>
          <graphic xlink:href="https://gmd.copernicus.org/articles/19/2691/2026/gmd-19-2691-2026-f15.png"/>

        </fig>

      <p id="d2e2815">Figure 13 shows the count distribution of MERRA-2 SSA at 550 nm for the aerosol regimes represented by the clusters C0, C1, C3, and C4, as classified by the random forest classifier we developed. Histograms of clusters of SSA at 550 nm presented in Fig. 13 were generated following a Gaussian distribution, considering the cluster average as the central value of each optical regime cluster and standard deviation as the typical spread. A similar analysis was conducted for the Angstrom Exponent (Fig. 14) to evaluate aspects related to particle size distribution. Based on Fig. 13, we found that, on average, our aerosol optical regime prescription based on the clusters (AERONET) is less absorbing than MERRA-2 for aerosol regimes C0, C1, C3, and C4. More significant differences are observed for C1, C3, and C4. Cluster C1 corresponds to a dust scenario closer to pure dust, while C4 is dominated by smoke. Regarding the particle size indicator (AE), it was observed that MERRA-2 has a lower contribution of coarse particles in the dust regimes compared to the cluster-based prescriptions (Fig. 14a and b). This finding aligns with Adebiyi et al. (2023), who noted that climate models tend to underestimate large dust particles, mainly when representing North African dust plumes. Conversely, for the non-dust regimes (C3, C4), MERRA-2 shows a larger relative contribution of coarse particles than the clusters-based prescription (Fig. 14c and d). Figure 15 shows the results for C2. For this specific regime, on average, prescriptions based on the cluster (AERONET) are more absorbing than MERRA-2, opposite to the findings of the other clusters. Regarding AE, under the C2 regime, MERRA-2's mean AE is lower than that prescribed from the cluster, suggesting a lower relative contribution of fine mode in the reanalysis simulations. This is similar to the findings related to the two other fine-mode dominant regimes (C3 and C4).</p>
      <p id="d2e2818">As demonstrated by the SSA and AE distributions (Fig. 13–15) and evaluated from Tables 1 and 4, the model can also predict the occurrence of the minority cluster C2 (3 %–4 % of samples). The model preserves the distribution of optical properties of less frequent aerosol regimes while capturing MERRA-2 features without the need for explicit class imbalance treatment, with C2's highly absorbing and dominant fine mode conditions reflected in both SSA and AE predictions, with the distributions of values across clusters showing coherence with MERRA-2 values. With C2's highly absorbing and dominant fine mode conditions reflected in both SSA and AE predictions, the distributions across clusters demonstrate agreement between expected and observed distribution values.</p>
</sec>
</sec>
<sec id="Ch1.S4" sec-type="conclusions">
  <label>4</label><title>Conclusions</title>
      <p id="d2e2830">This study emphasizes the importance of observational-based research to constrain the prescription of aerosol-intensive properties in atmospheric models. We aimed to characterize the typical aerosol intensive optical properties affecting the Iberian Peninsula (IP) using data from the atmospheric column AERONET sky inversion products. We employed <inline-formula><mml:math id="M105" display="inline"><mml:mi>K</mml:mi></mml:math></inline-formula>-means clustering to analyze historical aerosol intensive properties across all AERONET sites that operated for at least two years and had the highest quality dataset level (2.0) available. We identified five distinct clusters (C0, C1, C2, C3, and C4) representing different optical regimes, illustrating the predominant aerosol scenarios in the IP. The key difference among these clusters lies in the contribution of coarse-mode particles and their absorption efficiency. Clusters C0 and C1 are dominated by coarse-mode particles and classified as dust regimes due to their association with Saharan dust transport. In particular, the optical properties of C1 closely resemble a pure dust scenario, while C0 indicates a more mixed situation, which we refer to as dusty. On the other hand, clusters C2 and C4 are identified as non-dust regimes, linked to strong and moderate absorption related to smoke plumes. Cluster C3, also a non-dust regime, is more frequently observed in the eastern part of the IP and differs from C4 mainly by having a much lower real part of the refractive index. After identifying the typical aerosol regimes affecting the IP, we utilized aerosol-type columnar mass density data (dust, organic carbon, black carbon, sea salt, and sulfates) from MERRA-2 to predict the aerosol optical regime at each grid point using the supervised learning methodology Random Forest. We tested the performance of the trained model under various aerosol scenarios. The accuracy of the predictions for the aerosol optical regimes ranged from 60 % to 75 %, depending on the regime, with an average accuracy of 70 %. Notably, the accuracy exceeded 90 % when predicting solely dust or non-dust optical regimes.</p>
      <p id="d2e2840">An analysis of MERRA-2 simulations alongside this study's AERONET cluster-based prescriptions of optical regime indicators, such as absorption (SSA) and size (AE), reveals that MERRA-2 is generally more absorbing for the aerosol optical regimes (C0, C1, C3, and C4) impacting the atmosphere of the Iberian Peninsula, except for the most absorbing regime (C2). Specifically, the reanalysis simulations indicate higher absorption under the non-dust regimes C3 and C4. When examining the relative contributions of fine and coarse modes, the cluster-based prescription indicates a larger average contribution of coarse particles than the MERRA-2 under dust regimes (C0, C1). Conversely, for the non-dust regimes (C2, C3, C4), MERRA-2 shows a lower relative contribution from the fine mode compared to the clusters-based prescription.</p>
      <p id="d2e2843">Our findings contribute to enhancing the understanding of the dynamic aerosol optical properties over the Iberian Peninsula and highlight the potential of machine-learning approaches to improve the representation of aerosol radiative forcing in atmospheric models. Many atmospheric modelling systems are not designed to simulate aerosol-intensive microphysical and optical properties in real time. Additionally, computational cost remains a common limitation worldwide. Our approach integrates AERONET-derived intensive properties based on climatological optical regimes to refine the model, coupled with predicted aerosol-type columnar mass density. This integration can help reduce regional uncertainty in the simulation of aerosol radiative forcing.</p>
      <p id="d2e2846">Nevertheless, we acknowledge that additional research and analysis are necessary to build on the developments and findings presented here. Among the potential limitations and directions for future work, we emphasize the importance of better understanding the impact of AERONET parameter uncertainties on the clustering process, as well as conducting an intercomparison between basic and more advanced clustering approaches. A natural extension of this study would be the development of a comprehensive investigation focused on radiative transfer calculations, within which the proposed method could be thoroughly evaluated.</p>
</sec>

      
      </body>
    <back><notes notes-type="codedataavailability"><title>Code and data availability</title>

      <p id="d2e2854">All the datasets (AERONET and MERRA-2) used in this study are publicly available and were downloaded from their respective websites (<uri>https://aeronet.gsfc.nasa.gov/</uri>, last access: 1 April 2026; and <uri>https://disc.gsfc.nasa.gov/datasets?project=MERRA-2</uri>, last access: 1 April 2026). Code and dataset required to conduct the analyses herein is available at <ext-link xlink:href="https://doi.org/10.5281/zenodo.14825197" ext-link-type="DOI">10.5281/zenodo.14825197</ext-link> (Rosario, 2025).</p>
  </notes><app-group>
        <supplementary-material position="anchor"><p id="d2e2866">The supplement related to this article is available online at <inline-supplementary-material xlink:href="https://doi.org/10.5194/gmd-19-2691-2026-supplement" xlink:title="pdf">https://doi.org/10.5194/gmd-19-2691-2026-supplement</inline-supplementary-material>.</p></supplementary-material>
        </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e2875">NR, KL and PT designed and performed the research, analyzed the data, and wrote the first version of the paper. MY, SF, LF, OM, HFCV contributed to writing, discussion, review and editing. ICM and AIM conceptualization and coordination of the Project FIRESMOKE, discussion, review and editing.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e2881">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e2887">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. The authors bear the ultimate responsibility for providing appropriate place names. Views expressed in the text are those of the authors and do not necessarily reflect the views of the publisher.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e2893">This work was developed as part of the projects FIRESMOKE (<ext-link xlink:href="https://doi.org/10.54499/PTDC/CTA-MET/3392/2020" ext-link-type="DOI">10.54499/PTDC/CTA-MET/3392/2020</ext-link>), LARGEFIRES (<ext-link xlink:href="https://doi.org/10.54499/2023.17415.ICDT" ext-link-type="DOI">10.54499/2023.17415.ICDT</ext-link>) and of CESAM – Centro de Estudos do Ambiente e do Mar (UID/50017/2025 and LA/P/0094/2020). We thank the AERONET and MERRA-2 PIs and teams for their effort in establishing and maintaining the observational sites and reanalysis products used in this study. We acknowledge the use of imagery from the Worldview Snapshots application (<uri>https://wvs.earthdata.nasa.gov</uri>, last access: 1 April 2026), part of the Earth Observing System Data and Information System (EOSDIS). Finally, we would like to acknowledge the constructive review comments by the two anonymous reviewers and the editor.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e2907">The authors acknowledge the financial support of FCT – Science and Technology Portuguese Foundation I.P., which funded the projects FIRESMOKE (<ext-link xlink:href="https://doi.org/10.54499/PTDC/CTA-MET/3392/2020" ext-link-type="DOI">10.54499/PTDC/CTA-MET/3392/2020</ext-link>) and LARGEFIRES (<ext-link xlink:href="https://doi.org/10.54499/2023.17415.ICDT" ext-link-type="DOI">10.54499/2023.17415.ICDT</ext-link>), through national funds. This work was also funded by national funds through FCT, under the project CESAM-Centro de Estudos do Ambiente e do Mar, references UID/50017/2025 (<ext-link xlink:href="https://doi.org/10.54499/UID/50017/2025" ext-link-type="DOI">10.54499/UID/50017/2025</ext-link>) and LA/P/0094/2020 (<ext-link xlink:href="https://doi.org/10.54499/LA/P/0094/2020" ext-link-type="DOI">10.54499/LA/P/0094/2020</ext-link>). The authors also acknowledge the financial support from the Conselho Nacional de Desenvolvimento Científico e Tecnológico (CNPq, Brazil) under grant agreement nos. 441851/2023-1, 172486/2023-8, and 315349/2023-9.</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e2925">This paper was edited by Klaus Klingmüller and reviewed by two anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bib1"><label>1</label><mixed-citation>Abraham, A., Pedregosa, F., Eickenberg, M., Gervais, P., Mueller, A., Kossaifi, J., Gramfort, A., Thirion, B., and Varoquaux, G.: Machine Learning for Neuroimaging with Scikit-Learn, Front. Neuroinform., 8, 14, <ext-link xlink:href="https://doi.org/10.3389/fninf.2014.00014" ext-link-type="DOI">10.3389/fninf.2014.00014</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib2"><label>2</label><mixed-citation>Adebiyi, A. A., Huang, Y., and Samset, B. H.: Observations suggest that North African dust absorbs less solar radiation than models estimate, Commun. Earth Environ., 4, 168, <ext-link xlink:href="https://doi.org/10.1038/s43247-023-00825-2" ext-link-type="DOI">10.1038/s43247-023-00825-2</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib3"><label>3</label><mixed-citation>Alvarez, A., Lecina-Diaz, J., Batllori, E., Duane, A., Brotons, L., and Retana, J.: Spatiotemporal patterns and drivers of extreme fire severity in Spain for the period 1985–2018, Agr. Forest Meteorol., 358, 110185, <ext-link xlink:href="https://doi.org/10.1016/j.agrformet.2024.110185" ext-link-type="DOI">10.1016/j.agrformet.2024.110185</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib4"><label>4</label><mixed-citation>Asfaw, H. W., McGee, T. K., and Correia, F. J.: Wildfire preparedness and response during the 2016 Arouca wildfires in rural Portugal, Int. J. Disast. Risk Reduct., 73, 102895, <ext-link xlink:href="https://doi.org/10.1016/j.ijdrr.2022.102895" ext-link-type="DOI">10.1016/j.ijdrr.2022.102895</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib5"><label>5</label><mixed-citation>Breiman, L.: Random Forests, Mach. Learn., 45, 5–32, <ext-link xlink:href="https://doi.org/10.1023/a:1010933404324" ext-link-type="DOI">10.1023/a:1010933404324</ext-link>, 2001.</mixed-citation></ref>
      <ref id="bib1.bib6"><label>6</label><mixed-citation>Brown, H., Liu, X., Pokhrel, R., Murphy, S., Lu, Z., Saleh, R., Mielonen, T., Kokkola, H., Bergman, T., Myhre, G., Skeie, R. B., Watson-Paris, D., Stier, P., Johnson, B., Bellouin, N., Schulz, M., Vakkari, V., Beukes, J. P., van Zyl, P. G., Liu, S., and Chand, D.: Biomass burning aerosols in most climate models are too absorbing, Nat. Commun., 12, 277, <ext-link xlink:href="https://doi.org/10.1038/s41467-020-20482-9" ext-link-type="DOI">10.1038/s41467-020-20482-9</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib7"><label>7</label><mixed-citation>Buchard, V. J., Randles, C. A., da Silva, A. M., Darmenov, A., Colarco, P. R., Govindaraju, R., Ferrare, R. A., Hair, J., Beyersdorf, A., Ziemba, L. D., and Yu, H.: The MERRA-2 Aerosol Reanalysis, 1980 Onward. Part II: Evaluation and Case Studies, J. Climate, 30, 6851–6872, <ext-link xlink:href="https://doi.org/10.1175/JCLI-D-16-0613.1" ext-link-type="DOI">10.1175/JCLI-D-16-0613.1</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib8"><label>8</label><mixed-citation>Cachorro, V. E., Burgos, M. A., Mateos, D., Toledano, C., Bennouna, Y., Torres, B., de Frutos, Á. M., and Herguedas, Á.: Inventory of African desert dust events in the north-central Iberian Peninsula in 2003–2014 based on sun-photometer–AERONET and particulate-mass–EMEP data, Atmos. Chem. Phys., 16, 8227–8248, <ext-link xlink:href="https://doi.org/10.5194/acp-16-8227-2016" ext-link-type="DOI">10.5194/acp-16-8227-2016</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib9"><label>9</label><mixed-citation>Chen, G., Wang, J., Wang, Y., Wang, J., Jin, Y., and Cheng, Y.: An aerosol optical module with observation-constrained black carbon properties for global climate models, J. Adv. Model. Earth Syst., 15, e2022MS003501, <ext-link xlink:href="https://doi.org/10.1029/2022MS003501" ext-link-type="DOI">10.1029/2022MS003501</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib10"><label>10</label><mixed-citation>Chin, M., Ginoux, P., Kinne, S., Torres, O., Holben, B. N., Duncan, B. N., Martin, R. V., Logan, J. A., Higurashi, A., and Nakajima, T.: Tropospheric aerosol optical thickness from the GOCART model and comparisons with satellite and sun photometer measurements, J. Atmos. Sci., 59, 461–483, <ext-link xlink:href="https://doi.org/10.1175/1520-0469(2002)059&lt;0461:taotft&gt;2.0.co;2" ext-link-type="DOI">10.1175/1520-0469(2002)059&lt;0461:taotft&gt;2.0.co;2</ext-link>, 2002.</mixed-citation></ref>
      <ref id="bib1.bib11"><label>11</label><mixed-citation>Colarco, P., Da Silva, A., Chin, M., and Diehl, T.: Online simulations of global aerosol distributions in the NASA GEOS-4 model and comparisons to satellite and ground-based aerosol optical depth, J. Geophys. Res.-Atmos., 115, D14207, <ext-link xlink:href="https://doi.org/10.1029/2009JD012820" ext-link-type="DOI">10.1029/2009JD012820</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib12"><label>12</label><mixed-citation>Colarco, P. R., Nowottnick, E. P., Randles, C. A., Yi, B., Yang, P., Kim, K. M., Smith, J. A., and Bardeen, C. G.: Impact of radiatively interactive dust aerosols in the NASA GEOS-5 climate model: Sensitivity to dust particle shape and refractive index, J. Geophys. Res.-Atmos., 119, 753–786, <ext-link xlink:href="https://doi.org/10.1002/2013JD020046" ext-link-type="DOI">10.1002/2013JD020046</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib13"><label>13</label><mixed-citation>Dubovik, O. and King, M. D.: A flexible inversion algorithm for retrieval of aerosol optical properties from Sun and sky radiance measurements, J. Geophys. Res., 105, 20673–20696, <ext-link xlink:href="https://doi.org/10.1029/2000JD900282" ext-link-type="DOI">10.1029/2000JD900282</ext-link>, 2000.</mixed-citation></ref>
      <ref id="bib1.bib14"><label>14</label><mixed-citation>Dubovik, O., Holben, B., Eck, T. F., Smirnov, A., Kaufman, Y. J., King, M. D., Tanré, D., and Slutsker, I.: Variability of Absorption and Optical Properties of Key Aerosol Types Observed in Worldwide Locations, J. Atmos. Sci., 59, 590–608, <ext-link xlink:href="https://doi.org/10.1175/1520-0469(2002)059&lt;0590:VOAAOP&gt;2.0.CO;2" ext-link-type="DOI">10.1175/1520-0469(2002)059&lt;0590:VOAAOP&gt;2.0.CO;2</ext-link>, 2002.</mixed-citation></ref>
      <ref id="bib1.bib15"><label>15</label><mixed-citation>Eck, T. F., Holben, B. N., Reid, J. S., Dubovik, O., Smirnov, A., O'Neill, N. T., Slutsker, I., and Kinne, S.: Wavelength dependence of the optical depth of biomass burning, urban, and desert dust aerosols, J. Geophys. Res., 104, 31333–31349, <ext-link xlink:href="https://doi.org/10.1029/1999jd900923" ext-link-type="DOI">10.1029/1999jd900923</ext-link>, 1999.</mixed-citation></ref>
      <ref id="bib1.bib16"><label>16</label><mixed-citation>Elias, T. G., Silva, A. M., Figueira, M. J., Belo, N., Pereira, S., Formenti, P., and Helas, G.: Aerosol extinction and absorption in Évora, Portugal, during the European 2003 summer heat wave, in: Proc. SPIE 5571, Remote Sensing of Clouds and the Atmosphere IX, <ext-link xlink:href="https://doi.org/10.1117/12.566579" ext-link-type="DOI">10.1117/12.566579</ext-link>, 2004.</mixed-citation></ref>
      <ref id="bib1.bib17"><label>17</label><mixed-citation>Ermitão, T., Páscoa, P., Trigo, I., Alonso, C., and Gouveia, C.: Mapping the Most Susceptible Regions to Fire in Portugal, Fire, 6, 254, <ext-link xlink:href="https://doi.org/10.3390/fire6070254" ext-link-type="DOI">10.3390/fire6070254</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib18"><label>18</label><mixed-citation>Fan, Y., Sun, X., Huang, H., Ti, R., and Liu, X.: The primary aerosol models and distribution characteristics over China based on the AERONET data, J. Quant. Spectrosc. Ra., 275, 107888, <ext-link xlink:href="https://doi.org/10.1016/j.jqsrt.2021.107888" ext-link-type="DOI">10.1016/j.jqsrt.2021.107888</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib19"><label>19</label><mixed-citation>Gelaro, R., McCarty, W., Suárez, M. J., Todling, R., Molod, A., Takacs, L., Randles, C. A., Darmenov, A., Bosilovich, M. G., Reichle, R., Wargan, K., Coy, L., Cullather, R., Draper, C., Akella, S., Buchard, V., Conaty, A., da Silva, A. M., Gu, W., Postylyakov, S., Keller, J. H., Gelaro, R., and Pawson, S.: The Modern-Era Retrospective Analysis for Research and Applications, Version 2 (MERRA-2), J. Climate, 30, 5419–5454, <ext-link xlink:href="https://doi.org/10.1175/JCLI-D-16-0758.1" ext-link-type="DOI">10.1175/JCLI-D-16-0758.1</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib20"><label>20</label><mixed-citation>Giles, D. M., Sinyuk, A., Sorokin, M. G., Schafer, J. S., Smirnov, A., Slutsker, I., Eck, T. F., Holben, B. N., Lewis, J. R., Campbell, J. R., Welton, E. J., Korkin, S. V., and Lyapustin, A. I.: Advancements in the Aerosol Robotic Network (AERONET) Version 3 database – automated near-real-time quality control algorithm with improved cloud screening for Sun photometer aerosol optical depth (AOD) measurements, Atmos. Meas. Tech., 12, 169–209, <ext-link xlink:href="https://doi.org/10.5194/amt-12-169-2019" ext-link-type="DOI">10.5194/amt-12-169-2019</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib21"><label>21</label><mixed-citation>Gliß, J., Mortier, A., Schulz, M., Andrews, E., Balkanski, Y., Bauer, S. E., Benedictow, A. M. K., Bian, H., Checa-Garcia, R., Chin, M., Ginoux, P., Griesfeller, J. J., Heckel, A., Kipling, Z., Kirkevåg, A., Kokkola, H., Laj, P., Le Sager, P., Lund, M. T., Lund Myhre, C., Matsui, H., Myhre, G., Neubauer, D., van Noije, T., North, P., Olivié, D. J. L., Rémy, S., Sogacheva, L., Takemura, T., Tsigaridis, K., and Tsyro, S. G.: AeroCom phase III multi-model evaluation of the aerosol life cycle and optical properties using ground- and space-based remote sensing as well as surface in situ observations, Atmos. Chem. Phys., 21, 87–128, <ext-link xlink:href="https://doi.org/10.5194/acp-21-87-2021" ext-link-type="DOI">10.5194/acp-21-87-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib22"><label>22</label><mixed-citation>Gómez-Amo, J. L., Estellés, V., Marcos, C., Segura, S., Esteve, A. R., Pedrós, R., Utrillas, M. P., and Martínez-Lozano, J. A.: Impact of dust and smoke mixing on column-integrated aerosol properties from observations during a severe wildfire episode over Valencia (Spain), Sci. Total Environ., 599–600, 2121–2134, <ext-link xlink:href="https://doi.org/10.1016/j.scitotenv.2017.05.041" ext-link-type="DOI">10.1016/j.scitotenv.2017.05.041</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib23"><label>23</label><mixed-citation>Groß, S., Tesche, M., Freudenthaler, V., Toledano, C., Wiegner, M., Ansmann, A., Althausen, D., and Seefeldner, M.: Characterization of Saharan dust, marine aerosols and mixtures of biomass-burning aerosols and dust by means of multi-wavelength depolarization and Raman lidar measurements during SAMUM 2, Tellus B, 63, 706–724, <ext-link xlink:href="https://doi.org/10.1111/j.1600-0889.2011.00556.x" ext-link-type="DOI">10.1111/j.1600-0889.2011.00556.x</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib24"><label>24</label><mixed-citation>Gupta, P., Remer, L. A., Levy, R. C., and Mattoo, S.: Validation of MODIS 3 km land aerosol optical depth from NASA's EOS Terra and Aqua missions, Atmos. Meas. Tech., 11, 3145–3159, <ext-link xlink:href="https://doi.org/10.5194/amt-11-3145-2018" ext-link-type="DOI">10.5194/amt-11-3145-2018</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib25"><label>25</label><mixed-citation>Hammed, R. A., Alawode, G. L., Montoya, L. E., Krasovskiy, A., and Kraxner, F.: Exploring Drivers of Wildfires in Spain, Land, 13, 762, <ext-link xlink:href="https://doi.org/10.3390/land13060762" ext-link-type="DOI">10.3390/land13060762</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib26"><label>26</label><mixed-citation> Hess, M., Koepke, P., and Schult, I.: Optical properties of aerosols and clouds: The software package OPAC, B. Am. Meteorol. Soc., 79, 831–844, 1998.</mixed-citation></ref>
      <ref id="bib1.bib27"><label>27</label><mixed-citation>Hoelzemann, J. J., Longo, K. M., Fonseca, R. M., do Rosario, N. M. E., Elbern, H., Freitas, S. R., and Pires, C.: Regional representativity of AERONET observation sites during the biomass burning season in South America determined by correlation studies with MODIS Aerosol Optical Depth, J. Geophys. Res., 114, D13301, <ext-link xlink:href="https://doi.org/10.1029/2008jd010369" ext-link-type="DOI">10.1029/2008jd010369</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bib28"><label>28</label><mixed-citation>Holben, B. N., Eck, T. F., Slutsker, I., Tanre, D., Buis, J. P., Setzer, A., Vermote, E., Reagan, J. A., Kaufman, Y. J., Nakajima, T., Lavenu, F., Jankowiak, I., and Smirnov, A.: AERONET– A Federated Instrument Network and Data Archive for Aerosol Characterization, Remote Sens. Environ., 66, 1–16, <ext-link xlink:href="https://doi.org/10.1016/s0034-4257(98)00031-5" ext-link-type="DOI">10.1016/s0034-4257(98)00031-5</ext-link>, 1998.</mixed-citation></ref>
      <ref id="bib1.bib29"><label>29</label><mixed-citation>Holben, B. N., Eck, T. F., Slutsker, I., Smirnov, A., Sinyuk, A., Schafer, J., Giles, D., and Dubovik, O.: AERONET's version 2.0 quality assurance criteria, Proc. SPIE, 6408, 64080Q, <ext-link xlink:href="https://doi.org/10.1117/12.706524" ext-link-type="DOI">10.1117/12.706524</ext-link>, 2006.</mixed-citation></ref>
      <ref id="bib1.bib30"><label>30</label><mixed-citation>Illingworth, A. J., Barker, H. W., Beljaars, A., Ceccaldi, M., Chepfer, H., Clerbaux, N., Cole, J., Delanoë, J., Domenech, C., Donovan, D. P., Fukuda, S., Hirakata, M., Hogan, R. J., Huenerbein, A., Kollias, P., Kubota, T., Nakajima, T., Nakajima, T. Y., Nishizawa, T., Ohno, Y., Okada, K., Oki, R., Sato, K., Satoh, M., Shephard, M. W., Velázquez-Blázquez, A., Wandinger, U., Wehr, T., and van Zadelhoff, G. J.: The EarthCARE Satellite: The Next Step Forward in Global Measurements of Clouds, Aerosols, Precipitation, and Radiation, B. Am. Meteorol. Soc., 96, 1311–1332, <ext-link xlink:href="https://doi.org/10.1175/BAMS-D-12-00227.1" ext-link-type="DOI">10.1175/BAMS-D-12-00227.1</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib31"><label>31</label><mixed-citation>IPCC: Climate Change 2021 – the Physical Science Basis, in: Contribution of Working Group I to the Sixth Assessment Report of the Intergovernmental Panel on Climate Change, edited by: Masson-Delmotte, V., Zhai, P., Pirani, A., Connors, S. L., Péan, C., Berger, S., Caud, N., Chen, Y., Goldfarb, L., Gomis, M. I., Huang, M., Leitzell, K., Lonnoy, E., Matthews, J. B. R., Maycock, T. K., Waterfield, T., Yelekçi, O., Yu, R., and Zhou, B., Cambridge University Press, Cambridge, UK and New York, NY, USA, <ext-link xlink:href="https://doi.org/10.1017/9781009157896" ext-link-type="DOI">10.1017/9781009157896</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib32"><label>32</label><mixed-citation>Kanitz, T., Ansmann, A., Engelmann, R., and Althausen, D.: North-south cross sections of the vertical aerosol distribution over the Atlantic Ocean from multiwavelength Raman/polarization lidar during Polarstern cruises, J. Geophys. Res.-Atmos., 118, 2643–2655, <ext-link xlink:href="https://doi.org/10.1002/jgrd.50273" ext-link-type="DOI">10.1002/jgrd.50273</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib33"><label>33</label><mixed-citation>Kim, D. and Ramanathan, V.: Solar Radiation Budget and Radiative Forcing Due to Aerosols and Clouds, J. Geophys. Res.-Atmos., 113, D02203, <ext-link xlink:href="https://doi.org/10.1029/2007JD008434" ext-link-type="DOI">10.1029/2007JD008434</ext-link>, 2008.</mixed-citation></ref>
      <ref id="bib1.bib34"><label>34</label><mixed-citation>Koepke, P., Hess, M., Schult, I., and Shettle, E. P.: Global aerosol data set, Rep. 243, Max-Planck-Inst. für Meteorol., Hamburg, Germany, <uri>https://mpimet.mpg.de/fileadmin/publikationen/Reports/max_scirep_243.pdf</uri> (last access: 1 April 2026), 1997.</mixed-citation></ref>
      <ref id="bib1.bib35"><label>35</label><mixed-citation>Krishnaveni, S. A., Madhavan, B. L., and Ratnam, M. V.: Aerosol classification using fuzzy clustering over a tropical rural site, Atmos. Res., 282, 106518, <ext-link xlink:href="https://doi.org/10.1016/j.atmosres.2022.106518" ext-link-type="DOI">10.1016/j.atmosres.2022.106518</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib36"><label>36</label><mixed-citation>Levy, R. C., Remer, L. A., and Dubovik, O.: Global aerosol optical properties and application to Moderate Resolution Imaging Spectroradiometer aerosol retrieval over land, J. Geophys. Res.-Atmos., 112, D13210, <ext-link xlink:href="https://doi.org/10.1029/2006JD007815" ext-link-type="DOI">10.1029/2006JD007815</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib37"><label>37</label><mixed-citation>Levy, R. C., Remer, L. A., Kleidman, R. G., Mattoo, S., Ichoku, C., Kahn, R., and Eck, T. F.: Global evaluation of the Collection 5 MODIS dark-target aerosol products over land, Atmos. Chem. Phys., 10, 10399–10420, <ext-link xlink:href="https://doi.org/10.5194/acp-10-10399-2010" ext-link-type="DOI">10.5194/acp-10-10399-2010</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib38"><label>38</label><mixed-citation>Li, J., Liu, L., Lacis, A. A., and Carlson, B. E.: An optimal fitting approach to improve the GISS ModelE aerosol optical property parameterization using AERONET data, J. Geophys. Res., 115, D16211, <ext-link xlink:href="https://doi.org/10.1029/2010JD013909" ext-link-type="DOI">10.1029/2010JD013909</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib39"><label>39</label><mixed-citation>Li, J., Carlson, B. E., and Yung, Y. L.: Scattering and absorbing aerosols in the climate system, Natl. Rev. Earth Environ., 3, 363–379, <ext-link xlink:href="https://doi.org/10.1038/s43017-022-00296-7" ext-link-type="DOI">10.1038/s43017-022-00296-7</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib40"><label>40</label><mixed-citation> Li, Z., Zhang, Y., Xu, H., Li, K., Dubovik, O., and Goloub, P.: The Fundamental Aerosol Models Over China Region: A Cluster Analysis of the Ground-Based Remote Sensing Measurements of Total Columnar Atmosphere, Geophys. Res. Lett., 46, 4924–4932, 2019.</mixed-citation></ref>
      <ref id="bib1.bib41"><label>41</label><mixed-citation>Martins, J. V., Artaxo, P., Kaufman, Y. J., Castanho, A. D., and Remer, L. A.: Spectral absorption properties of aerosol particles from 350–2500 nm, Geophys. Res. Lett., 36, L13810, <ext-link xlink:href="https://doi.org/10.1029/2009GL037435" ext-link-type="DOI">10.1029/2009GL037435</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bib42"><label>42</label><mixed-citation> Moise, T., Flores, J. M., and Rudich, Y.: Optical properties of secondary organic aerosols and their changes by chemical processes, Chem. Rev., 115, 4400–4439, 2015.</mixed-citation></ref>
      <ref id="bib1.bib43"><label>43</label><mixed-citation>Omar, A. H., Won, J.-G., Winker, D. M., Yoon, S.-C., Dubovik, O., and McCormick, M. P.: Development of global aerosol models using cluster analysis of Aerosol Robotic Network (AERONET) measurements, J. Geophys. Res., 110, D10S14, <ext-link xlink:href="https://doi.org/10.1029/2004JD004874" ext-link-type="DOI">10.1029/2004JD004874</ext-link>, 2005.</mixed-citation></ref>
      <ref id="bib1.bib44"><label>44</label><mixed-citation>Osborne, M., Malavelle, F. F., Adam, M., Buxmann, J., Sugier, J., Marenco, F., and Haywood, J.: Saharan dust and biomass burning aerosols during ex-hurricane Ophelia: observations from the new UK lidar and sun-photometer network, Atmos. Chem. Phys., 19, 3557–3578, <ext-link xlink:href="https://doi.org/10.5194/acp-19-3557-2019" ext-link-type="DOI">10.5194/acp-19-3557-2019</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib45"><label>45</label><mixed-citation>Pokhrel, R. P., Beamesderfer, E. R., Wagner, N. L., Langridge, J. M., Lack, D. A., Jayarathne, T., Stone, E. A., Stockwell, C. E., Yokelson, R. J., and Murphy, S. M.: Relative importance of black carbon, brown carbon, and absorption enhancement from clear coatings in biomass burning emissions, Atmos. Chem. Phys., 17, 5063–5078, <ext-link xlink:href="https://doi.org/10.5194/acp-17-5063-2017" ext-link-type="DOI">10.5194/acp-17-5063-2017</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib46"><label>46</label><mixed-citation>Proske, U., Ferrachat, S., and Lohmann, U.: Developing a climatological simplification of aerosols to enter the cloud microphysics of a global climate model, Atmos. Chem. Phys., 24, 5907–5933, <ext-link xlink:href="https://doi.org/10.5194/acp-24-5907-2024" ext-link-type="DOI">10.5194/acp-24-5907-2024</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib47"><label>47</label><mixed-citation> Reid, J. S. and Hobbs, P. V.: Physical and optical properties of young smoke from individual biomass fires in Brazil, J. Geophys. Res., 103, 32013–32030, 1998.</mixed-citation></ref>
      <ref id="bib1.bib48"><label>48</label><mixed-citation>Reid, J. S., Eck, T. F., Christopher, S. A., Koppmann, R., Dubovik, O., Eleuterio, D. P., Holben, B. N., Reid, E. A., and Zhang, J.: A review of biomass burning emissions part III: intensive optical properties of biomass burning particles, Atmos. Chem. Phys., 5, 827–849, <ext-link xlink:href="https://doi.org/10.5194/acp-5-827-2005" ext-link-type="DOI">10.5194/acp-5-827-2005</ext-link>, 2005.</mixed-citation></ref>
      <ref id="bib1.bib49"><label>49</label><mixed-citation>Rodríguez, S. and López-Darias, J.: Extreme Saharan dust events expand northward over the Atlantic and Europe, prompting record-breaking PM<sub>10</sub> and PM<sub>2.5</sub> episodes, Atmos. Chem. Phys., 24, 12031–12053, <ext-link xlink:href="https://doi.org/10.5194/acp-24-12031-2024" ext-link-type="DOI">10.5194/acp-24-12031-2024</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib50"><label>50</label><mixed-citation>Rosario, N. E.: Machine learning-driven characterization and prescription of aerosol optical properties for atmospheric models, Zenodo [code an data set], <ext-link xlink:href="https://doi.org/10.5281/zenodo.14825197" ext-link-type="DOI">10.5281/zenodo.14825197</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib51"><label>51</label><mixed-citation>Rosário, N. E., Longo, K. M., Freitas, S. R., Yamasoe, M. A., and Fonseca, R. M.: Modeling the South American regional smoke plume: aerosol optical depth variability and surface shortwave flux perturbation, Atmos. Chem. Phys., 13, 2923–2938, <ext-link xlink:href="https://doi.org/10.5194/acp-13-2923-2013" ext-link-type="DOI">10.5194/acp-13-2923-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib52"><label>52</label><mixed-citation>Russell, P. B., Kacenelenbogen, M., Livingston, J. M., Hasekamp, O. P., Burton, S. P., Schuster, G. L., Johnson, M. S., Knobelspiesse, K. D., Redemann, J., Ramachandran, S., and Holben, B.: A multiparameter aerosol classification method and its application to retrievals from spaceborne polarimetry, J. Geophys. Res.-Atmos., 119, 9838–9863, <ext-link xlink:href="https://doi.org/10.1002/2013JD021411" ext-link-type="DOI">10.1002/2013JD021411</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib53"><label>53</label><mixed-citation>Saleh, R., Robinson, E. S., Tkacik, D. S., Ahern, A. T., Liu, S., Aiken, A. C., Sullivan, R. C., Presto, A. A., Dubey, M. K., Yokelson, R. J., Donahue, N. M., and Robinson, A. L.: Brownness of organics in aerosols from biomass burning linked to their black carbon content, Nat. Geosci., 7, 647–650, <ext-link xlink:href="https://doi.org/10.1038/ngeo2220" ext-link-type="DOI">10.1038/ngeo2220</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib54"><label>54</label><mixed-citation>Samset, B. H., Stjern, C. W., Andrews, E., Kahn, R. A., Myhre, G., Schulz, M., and Schuster, G. L.: Aerosol Absorption: Progress Towards Global and Regional Constraints, Curr. Clim. Change Rep., 4, 65–83, <ext-link xlink:href="https://doi.org/10.1007/s40641-018-0091-4" ext-link-type="DOI">10.1007/s40641-018-0091-4</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib55"><label>55</label><mixed-citation>Sand, M., Samset, B. H., Myhre, G., Gliß, J., Bauer, S. E., Bian, H., Chin, M., Checa-Garcia, R., Ginoux, P., Kipling, Z., Kirkevåg, A., Kokkola, H., Le Sager, P., Lund, M. T., Matsui, H., van Noije, T., Olivié, D. J. L., Remy, S., Schulz, M., Stier, P., Stjern, C. W., Takemura, T., Tsigaridis, K., Tsyro, S. G., and Watson-Parris, D.: Aerosol absorption in global models from AeroCom phase III, Atmos. Chem. Phys., 21, 15929–15947, <ext-link xlink:href="https://doi.org/10.5194/acp-21-15929-2021" ext-link-type="DOI">10.5194/acp-21-15929-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib56"><label>56</label><mixed-citation>Schwink, S. K., Mael, L. E., Dunnington, T. H., Schmid, M. J., Silberstein, J. M., Heck, A., Gotlib, N., Hannigan, M. P., and Vance, M. E.: Impacts of Aging and Relative Humidity on Properties of Biomass Burning Smoke Particles, ACS EST Air, 2, 109–118, <ext-link xlink:href="https://doi.org/10.1021/acsestair.4c00224" ext-link-type="DOI">10.1021/acsestair.4c00224</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bib57"><label>57</label><mixed-citation>Shettle, E. P. and Fenn, R. W.: Models for the aerosols of the lower atmosphere and the effects of humidity variations on their optical properties, Environmental Research Papers No. 676, AFGL-TR-79-0214, Optical Physics Division, Air Force Geophysics Laboratory, Hanscom AFB, MA, USA, 94 pp., <uri>https://books.google.com/books?id=JSlkjReviS4C</uri> (last access: 1 April 2026), 1979.</mixed-citation></ref>
      <ref id="bib1.bib58"><label>58</label><mixed-citation>Shi, C., Wei, B., and Wei, S.: A quantitative discriminant method of elbow point for the optimal number of clusters in clustering algorithm, J. Wireless Commun. Network, 2021, 31, <ext-link xlink:href="https://doi.org/10.1186/s13638-021-01910-w" ext-link-type="DOI">10.1186/s13638-021-01910-w</ext-link>, 2021. </mixed-citation></ref>
      <ref id="bib1.bib59"><label>59</label><mixed-citation>Shin, S. K., Tesche, M., Kim, K., Kezoudi, M., Tatarov, B., Müller, D., and Noh, Y.: On the spectral depolarisation and lidar ratio of mineral dust provided in the AERONET version 3 inversion product, Atmos. Chem. Phys., 18, 12735–12746, <ext-link xlink:href="https://doi.org/10.5194/acp-18-12735-2018" ext-link-type="DOI">10.5194/acp-18-12735-2018</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib60"><label>60</label><mixed-citation>Silva, P., Carmo, M., Rio, J., and Novo, I.: Changes in the Seasonality of Fire Activity and Fire Weather in Portugal: Is the Wildfire Season Really Longer?, Meteorology, 2, 74–86, <ext-link xlink:href="https://doi.org/10.3390/meteorology2010006" ext-link-type="DOI">10.3390/meteorology2010006</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib61"><label>61</label><mixed-citation>Sinyuk, A., Holben, B. N., Eck, T. F., Giles, D. M., Slutsker, I., Korkin, S., Schafer, J. S., Smirnov, A., Sorokin, M., and Lyapustin, A.: The AERONET Version 3 aerosol retrieval algorithm, associated uncertainties and comparisons to Version 2, Atmos. Meas. Tech., 13, 3375–3411, <ext-link xlink:href="https://doi.org/10.5194/amt-13-3375-2020" ext-link-type="DOI">10.5194/amt-13-3375-2020</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib62"><label>62</label><mixed-citation>Smirnov, A., Holben, B. N., Kaufman, Y. J., Dubovik, O., Eck, T. F., Slutsker, I., Pietras, C., and Halthore, R. N.: Optical Properties of Atmospheric Aerosol in Maritime Environments, J. Atmos. Sci., 59, 501–523, <ext-link xlink:href="https://doi.org/10.1175/1520-0469(2002)059&lt;0501:OPOAAI&gt;2.0.CO;2" ext-link-type="DOI">10.1175/1520-0469(2002)059&lt;0501:OPOAAI&gt;2.0.CO;2</ext-link>, 2002.</mixed-citation></ref>
      <ref id="bib1.bib63"><label>63</label><mixed-citation> Spencer, R. S., Levy, R. C., Remer, L. A., Mattoo, S., Arnold, G. T., Hlavka, D. L., Meyer, K. G., Marshak, A., Wilcox, E. M., and Platnick, S. E.: Exploring Aerosols near Clouds with High-Spatial-Resolution Aircraft Remote Sensing during SEAC(4)RS, J. Geophys. Res.-Atmos., 124, 2148–2173, 2019.</mixed-citation></ref>
      <ref id="bib1.bib64"><label>64</label><mixed-citation>Toledano, C., Cachorro, V. E., de Frutos, A. M., Sorribas, M., and Prats, N.: Inventory of African Desert Dust Events Over the Southwestern Iberian Peninsula in 2000–2005 with an AERONET Cimel Sun Photometer, J. Geophys. Res., 112, D21201, <ext-link xlink:href="https://doi.org/10.1029/2006JD008307" ext-link-type="DOI">10.1029/2006JD008307</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib65"><label>65</label><mixed-citation>Zhao, A., Ryder, C. L., and Wilcox, L. J.: How well do the CMIP6 models simulate dust aerosols?, Atmos. Chem. Phys., 22, 2095–2119, <ext-link xlink:href="https://doi.org/10.5194/acp-22-2095-2022" ext-link-type="DOI">10.5194/acp-22-2095-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib66"><label>66</label><mixed-citation>Zhao, G., Tan, T., Zhao, W., Guo, S., Tian, P., and Zhao, C.: A new parameterization scheme for the real part of the ambient urban aerosol refractive index, Atmos. Chem. Phys., 19, 12875–12885, <ext-link xlink:href="https://doi.org/10.5194/acp-19-12875-2019" ext-link-type="DOI">10.5194/acp-19-12875-2019</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib67"><label>67</label><mixed-citation>Zhong, Q., Schutgens, N., van der Werf, G. R., van Noije, T., Bauer, S. E., Tsigaridis, K., Mielonen, T., Checa-Garcia, R., Neubauer, D., Kipling, Z., Kirkevåg, A., Olivié, D. J. L., Kokkola, H., Matsui, H., Ginoux, P., Takemura, T., Le Sager, P., Rémy, S., Bian, H., and Chin, M.: Using modelled relationships and satellite observations to attribute modelled aerosol biases over biomass burning regions, Nat. Commun., 13, 5914, <ext-link xlink:href="https://doi.org/10.1038/s41467-022-33680-4" ext-link-type="DOI">10.1038/s41467-022-33680-4</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib68"><label>68</label><mixed-citation>Zhou, P., Wang, Y., Liu, J., Xu, L., Chen, X., and Zhang, L.: Difference between global and regional aerosol model classifications and associated implications for spaceborne aerosol optical depth retrieval, Atmos. Environ., 300, 119674, <ext-link xlink:href="https://doi.org/10.1016/j.atmosenv.2023.119674" ext-link-type="DOI">10.1016/j.atmosenv.2023.119674</ext-link>, 2023.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>Machine learning-driven characterization and prescription  of aerosol optical properties for atmospheric models</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>1</label><mixed-citation>
      
Abraham, A., Pedregosa, F., Eickenberg, M., Gervais, P., Mueller, A.,
Kossaifi, J., Gramfort, A., Thirion, B., and Varoquaux, G.: Machine Learning
for Neuroimaging with Scikit-Learn, Front. Neuroinform., 8, 14, <a href="https://doi.org/10.3389/fninf.2014.00014" target="_blank">https://doi.org/10.3389/fninf.2014.00014</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>2</label><mixed-citation>
      
Adebiyi, A. A., Huang, Y., and Samset, B. H.: Observations suggest that North African dust absorbs less solar radiation than models estimate, Commun. Earth Environ., 4, 168, <a href="https://doi.org/10.1038/s43247-023-00825-2" target="_blank">https://doi.org/10.1038/s43247-023-00825-2</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>3</label><mixed-citation>
      
Alvarez, A., Lecina-Diaz, J., Batllori, E., Duane, A., Brotons, L., and Retana, J.: Spatiotemporal patterns and drivers of extreme fire severity in Spain for the period 1985–2018, Agr. Forest Meteorol., 358, 110185,
<a href="https://doi.org/10.1016/j.agrformet.2024.110185" target="_blank">https://doi.org/10.1016/j.agrformet.2024.110185</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>4</label><mixed-citation>
      
Asfaw, H. W., McGee, T. K., and Correia, F. J.: Wildfire preparedness and
response during the 2016 Arouca wildfires in rural Portugal, Int. J. Disast. Risk Reduct., 73, 102895, <a href="https://doi.org/10.1016/j.ijdrr.2022.102895" target="_blank">https://doi.org/10.1016/j.ijdrr.2022.102895</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>5</label><mixed-citation>
      
Breiman, L.: Random Forests, Mach. Learn., 45, 5–32, <a href="https://doi.org/10.1023/a:1010933404324" target="_blank">https://doi.org/10.1023/a:1010933404324</a>, 2001.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>6</label><mixed-citation>
      
Brown, H., Liu, X., Pokhrel, R., Murphy, S., Lu, Z., Saleh, R., Mielonen, T., Kokkola, H., Bergman, T., Myhre, G., Skeie, R. B., Watson-Paris, D., Stier, P., Johnson, B., Bellouin, N., Schulz, M., Vakkari, V., Beukes, J. P., van Zyl, P. G., Liu, S., and Chand, D.: Biomass burning aerosols in most climate models are too absorbing, Nat. Commun., 12, 277,
<a href="https://doi.org/10.1038/s41467-020-20482-9" target="_blank">https://doi.org/10.1038/s41467-020-20482-9</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>7</label><mixed-citation>
      
Buchard, V. J., Randles, C. A., da Silva, A. M., Darmenov, A., Colarco, P. R., Govindaraju, R., Ferrare, R. A., Hair, J., Beyersdorf, A., Ziemba, L. D., and Yu, H.: The MERRA-2 Aerosol Reanalysis, 1980 Onward. Part II: Evaluation and Case Studies, J. Climate, 30, 6851–6872, <a href="https://doi.org/10.1175/JCLI-D-16-0613.1" target="_blank">https://doi.org/10.1175/JCLI-D-16-0613.1</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>8</label><mixed-citation>
      
Cachorro, V. E., Burgos, M. A., Mateos, D., Toledano, C., Bennouna, Y., Torres, B., de Frutos, Á. M., and Herguedas, Á.: Inventory of African desert dust events in the north-central Iberian Peninsula in 2003–2014 based on sun-photometer–AERONET and particulate-mass–EMEP data, Atmos. Chem. Phys., 16, 8227–8248, <a href="https://doi.org/10.5194/acp-16-8227-2016" target="_blank">https://doi.org/10.5194/acp-16-8227-2016</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>9</label><mixed-citation>
      
Chen, G., Wang, J., Wang, Y., Wang, J., Jin, Y., and Cheng, Y.: An aerosol
optical module with observation-constrained black carbon properties for global climate models, J. Adv. Model. Earth Syst., 15, e2022MS003501,
<a href="https://doi.org/10.1029/2022MS003501" target="_blank">https://doi.org/10.1029/2022MS003501</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>10</label><mixed-citation>
      
Chin, M., Ginoux, P., Kinne, S., Torres, O., Holben, B. N., Duncan, B. N.,
Martin, R. V., Logan, J. A., Higurashi, A., and Nakajima, T.: Tropospheric
aerosol optical thickness from the GOCART model and comparisons with satellite and sun photometer measurements, J. Atmos. Sci., 59, 461–483,
<a href="https://doi.org/10.1175/1520-0469(2002)059&lt;0461:taotft&gt;2.0.co;2" target="_blank">https://doi.org/10.1175/1520-0469(2002)059&lt;0461:taotft&gt;2.0.co;2</a>, 2002.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>11</label><mixed-citation>
      
Colarco, P., Da Silva, A., Chin, M., and Diehl, T.: Online simulations of
global aerosol distributions in the NASA GEOS-4 model and comparisons to
satellite and ground-based aerosol optical depth, J. Geophys. Res.-Atmos., 115, D14207, <a href="https://doi.org/10.1029/2009JD012820" target="_blank">https://doi.org/10.1029/2009JD012820</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>12</label><mixed-citation>
      
Colarco, P. R., Nowottnick, E. P., Randles, C. A., Yi, B., Yang, P., Kim, K.
M., Smith, J. A., and Bardeen, C. G.: Impact of radiatively interactive dust
aerosols in the NASA GEOS-5 climate model: Sensitivity to dust particle
shape and refractive index, J. Geophys. Res.-Atmos., 119, 753–786,
<a href="https://doi.org/10.1002/2013JD020046" target="_blank">https://doi.org/10.1002/2013JD020046</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>13</label><mixed-citation>
      
Dubovik, O. and King, M. D.: A flexible inversion algorithm for retrieval of aerosol optical properties from Sun and sky radiance measurements, J. Geophys. Res., 105, 20673–20696, <a href="https://doi.org/10.1029/2000JD900282" target="_blank">https://doi.org/10.1029/2000JD900282</a>, 2000.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>14</label><mixed-citation>
      
Dubovik, O., Holben, B., Eck, T. F., Smirnov, A., Kaufman, Y. J., King, M. D., Tanré, D., and Slutsker, I.: Variability of Absorption and Optical
Properties of Key Aerosol Types Observed in Worldwide Locations, J. Atmos.
Sci., 59, 590–608, <a href="https://doi.org/10.1175/1520-0469(2002)059&lt;0590:VOAAOP&gt;2.0.CO;2" target="_blank">https://doi.org/10.1175/1520-0469(2002)059&lt;0590:VOAAOP&gt;2.0.CO;2</a>, 2002.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>15</label><mixed-citation>
      
Eck, T. F., Holben, B. N., Reid, J. S., Dubovik, O., Smirnov, A., O'Neill, N. T., Slutsker, I., and Kinne, S.: Wavelength dependence of the optical depth of biomass burning, urban, and desert dust aerosols, J. Geophys. Res., 104, 31333–31349, <a href="https://doi.org/10.1029/1999jd900923" target="_blank">https://doi.org/10.1029/1999jd900923</a>, 1999.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>16</label><mixed-citation>
      
Elias, T. G., Silva, A. M., Figueira, M. J., Belo, N., Pereira, S.,
Formenti, P., and Helas, G.: Aerosol extinction and absorption in Évora,
Portugal, during the European 2003 summer heat wave, in: Proc. SPIE 5571, Remote Sensing of Clouds and the Atmosphere IX, <a href="https://doi.org/10.1117/12.566579" target="_blank">https://doi.org/10.1117/12.566579</a>,
2004.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>17</label><mixed-citation>
      
Ermitão, T., Páscoa, P., Trigo, I., Alonso, C., and Gouveia, C.:
Mapping the Most Susceptible Regions to Fire in Portugal, Fire, 6, 254,
<a href="https://doi.org/10.3390/fire6070254" target="_blank">https://doi.org/10.3390/fire6070254</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>18</label><mixed-citation>
      
Fan, Y., Sun, X., Huang, H., Ti, R., and Liu, X.: The primary aerosol models
and distribution characteristics over China based on the AERONET data, J.
Quant. Spectrosc. Ra., 275, 107888, <a href="https://doi.org/10.1016/j.jqsrt.2021.107888" target="_blank">https://doi.org/10.1016/j.jqsrt.2021.107888</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>19</label><mixed-citation>
      
Gelaro, R., McCarty, W., Suárez, M. J., Todling, R., Molod, A., Takacs,
L., Randles, C. A., Darmenov, A., Bosilovich, M. G., Reichle, R., Wargan, K., Coy, L., Cullather, R., Draper, C., Akella, S., Buchard, V., Conaty, A., da Silva, A. M., Gu, W., Postylyakov, S., Keller, J. H., Gelaro, R., and
Pawson, S.: The Modern-Era Retrospective Analysis for Research and Applications, Version 2 (MERRA-2), J. Climate, 30, 5419–5454,
<a href="https://doi.org/10.1175/JCLI-D-16-0758.1" target="_blank">https://doi.org/10.1175/JCLI-D-16-0758.1</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>20</label><mixed-citation>
      
Giles, D. M., Sinyuk, A., Sorokin, M. G., Schafer, J. S., Smirnov, A., Slutsker, I., Eck, T. F., Holben, B. N., Lewis, J. R., Campbell, J. R., Welton, E. J., Korkin, S. V., and Lyapustin, A. I.: Advancements in the Aerosol Robotic Network (AERONET) Version 3 database – automated near-real-time quality control algorithm with improved cloud screening for Sun photometer aerosol optical depth (AOD) measurements, Atmos. Meas. Tech., 12, 169–209, <a href="https://doi.org/10.5194/amt-12-169-2019" target="_blank">https://doi.org/10.5194/amt-12-169-2019</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>21</label><mixed-citation>
      
Gliß, J., Mortier, A., Schulz, M., Andrews, E., Balkanski, Y., Bauer, S. E., Benedictow, A. M. K., Bian, H., Checa-Garcia, R., Chin, M., Ginoux, P., Griesfeller, J. J., Heckel, A., Kipling, Z., Kirkevåg, A., Kokkola, H., Laj, P., Le Sager, P., Lund, M. T., Lund Myhre, C., Matsui, H., Myhre, G., Neubauer, D., van Noije, T., North, P., Olivié, D. J. L., Rémy, S., Sogacheva, L., Takemura, T., Tsigaridis, K., and Tsyro, S. G.: AeroCom phase III multi-model evaluation of the aerosol life cycle and optical properties using ground- and space-based remote sensing as well as surface in situ observations, Atmos. Chem. Phys., 21, 87–128, <a href="https://doi.org/10.5194/acp-21-87-2021" target="_blank">https://doi.org/10.5194/acp-21-87-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>22</label><mixed-citation>
      
Gómez-Amo, J. L., Estellés, V., Marcos, C., Segura, S., Esteve, A. R., Pedrós, R., Utrillas, M. P., and Martínez-Lozano, J. A.: Impact
of dust and smoke mixing on column-integrated aerosol properties from
observations during a severe wildfire episode over Valencia (Spain), Sci.
Total Environ., 599–600, 2121–2134, <a href="https://doi.org/10.1016/j.scitotenv.2017.05.041" target="_blank">https://doi.org/10.1016/j.scitotenv.2017.05.041</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>23</label><mixed-citation>
      
Groß, S., Tesche, M., Freudenthaler, V., Toledano, C., Wiegner, M., Ansmann, A., Althausen, D., and Seefeldner, M.: Characterization of Saharan
dust, marine aerosols and mixtures of biomass-burning aerosols and dust by
means of multi-wavelength depolarization and Raman lidar measurements during
SAMUM 2, Tellus B, 63, 706–724, <a href="https://doi.org/10.1111/j.1600-0889.2011.00556.x" target="_blank">https://doi.org/10.1111/j.1600-0889.2011.00556.x</a>, 2011.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>24</label><mixed-citation>
      
Gupta, P., Remer, L. A., Levy, R. C., and Mattoo, S.: Validation of MODIS 3&thinsp;km land aerosol optical depth from NASA's EOS Terra and Aqua missions, Atmos. Meas. Tech., 11, 3145–3159, <a href="https://doi.org/10.5194/amt-11-3145-2018" target="_blank">https://doi.org/10.5194/amt-11-3145-2018</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>25</label><mixed-citation>
      
Hammed, R. A., Alawode, G. L., Montoya, L. E., Krasovskiy, A., and Kraxner, F.: Exploring Drivers of Wildfires in Spain, Land, 13, 762,
<a href="https://doi.org/10.3390/land13060762" target="_blank">https://doi.org/10.3390/land13060762</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>26</label><mixed-citation>
      
Hess, M., Koepke, P., and Schult, I.: Optical properties of aerosols and clouds: The software package OPAC, B. Am. Meteorol. Soc., 79, 831–844, 1998.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>27</label><mixed-citation>
      
Hoelzemann, J. J., Longo, K. M., Fonseca, R. M., do Rosario, N. M. E., Elbern, H., Freitas, S. R., and Pires, C.: Regional representativity of AERONET observation sites during the biomass burning season in South America
determined by correlation studies with MODIS Aerosol Optical Depth, J. Geophys. Res., 114, D13301, <a href="https://doi.org/10.1029/2008jd010369" target="_blank">https://doi.org/10.1029/2008jd010369</a>, 2009.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>28</label><mixed-citation>
      
Holben, B. N., Eck, T. F., Slutsker, I., Tanre, D., Buis, J. P., Setzer, A.,
Vermote, E., Reagan, J. A., Kaufman, Y. J., Nakajima, T., Lavenu, F., Jankowiak, I., and Smirnov, A.: AERONET– A Federated Instrument Network and
Data Archive for Aerosol Characterization, Remote Sens. Environ., 66, 1–16,
<a href="https://doi.org/10.1016/s0034-4257(98)00031-5" target="_blank">https://doi.org/10.1016/s0034-4257(98)00031-5</a>, 1998.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>29</label><mixed-citation>
      
Holben, B. N., Eck, T. F., Slutsker, I., Smirnov, A., Sinyuk, A., Schafer, J., Giles, D., and Dubovik, O.: AERONET's version 2.0 quality assurance criteria, Proc. SPIE, 6408, 64080Q, <a href="https://doi.org/10.1117/12.706524" target="_blank">https://doi.org/10.1117/12.706524</a>, 2006.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>30</label><mixed-citation>
      
Illingworth, A. J., Barker, H. W., Beljaars, A., Ceccaldi, M., Chepfer, H.,
Clerbaux, N., Cole, J., Delanoë, J., Domenech, C., Donovan, D. P., Fukuda, S., Hirakata, M., Hogan, R. J., Huenerbein, A., Kollias, P., Kubota, T., Nakajima, T., Nakajima, T. Y., Nishizawa, T., Ohno, Y., Okada, K., Oki,
R., Sato, K., Satoh, M., Shephard, M. W., Velázquez-Blázquez, A.,
Wandinger, U., Wehr, T., and van Zadelhoff, G. J.: The EarthCARE Satellite:
The Next Step Forward in Global Measurements of Clouds, Aerosols, Precipitation, and Radiation, B. Am. Meteorol. Soc., 96, 1311–1332,
<a href="https://doi.org/10.1175/BAMS-D-12-00227.1" target="_blank">https://doi.org/10.1175/BAMS-D-12-00227.1</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>31</label><mixed-citation>
      
IPCC: Climate Change 2021 – the Physical Science Basis, in: Contribution of
Working Group I to the Sixth Assessment Report of the Intergovernmental Panel on Climate Change, edited by: Masson-Delmotte, V., Zhai, P., Pirani, A., Connors, S. L., Péan, C., Berger, S., Caud, N., Chen, Y., Goldfarb, L., Gomis, M. I., Huang, M., Leitzell, K., Lonnoy, E., Matthews, J. B. R., Maycock, T. K., Waterfield, T., Yelekçi, O., Yu, R., and Zhou, B., Cambridge University Press, Cambridge, UK and New York, NY, USA, <a href="https://doi.org/10.1017/9781009157896" target="_blank">https://doi.org/10.1017/9781009157896</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>32</label><mixed-citation>
      
Kanitz, T., Ansmann, A., Engelmann, R., and Althausen, D.: North-south cross
sections of the vertical aerosol distribution over the Atlantic Ocean from
multiwavelength Raman/polarization lidar during Polarstern cruises, J. Geophys. Res.-Atmos., 118, 2643–2655, <a href="https://doi.org/10.1002/jgrd.50273" target="_blank">https://doi.org/10.1002/jgrd.50273</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>33</label><mixed-citation>
      
Kim, D. and Ramanathan, V.: Solar Radiation Budget and Radiative Forcing Due to Aerosols and Clouds, J. Geophys. Res.-Atmos., 113, D02203,
<a href="https://doi.org/10.1029/2007JD008434" target="_blank">https://doi.org/10.1029/2007JD008434</a>, 2008.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>34</label><mixed-citation>
      
Koepke, P., Hess, M., Schult, I., and Shettle, E. P.: Global aerosol data
set, Rep. 243, Max-Planck-Inst. für Meteorol., Hamburg, Germany, <a href="https://mpimet.mpg.de/fileadmin/publikationen/Reports/max_scirep_243.pdf" target="_blank"/> (last access: 1 April 2026), 1997.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>35</label><mixed-citation>
      
Krishnaveni, S. A., Madhavan, B. L., and Ratnam, M. V.: Aerosol classification using fuzzy clustering over a tropical rural site, Atmos. Res., 282, 106518, <a href="https://doi.org/10.1016/j.atmosres.2022.106518" target="_blank">https://doi.org/10.1016/j.atmosres.2022.106518</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>36</label><mixed-citation>
      
Levy, R. C., Remer, L. A., and Dubovik, O.: Global aerosol optical properties and application to Moderate Resolution Imaging Spectroradiometer aerosol retrieval over land, J. Geophys. Res.-Atmos., 112, D13210, <a href="https://doi.org/10.1029/2006JD007815" target="_blank">https://doi.org/10.1029/2006JD007815</a>, 2007.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>37</label><mixed-citation>
      
Levy, R. C., Remer, L. A., Kleidman, R. G., Mattoo, S., Ichoku, C., Kahn, R., and Eck, T. F.: Global evaluation of the Collection 5 MODIS dark-target aerosol products over land, Atmos. Chem. Phys., 10, 10399–10420,
<a href="https://doi.org/10.5194/acp-10-10399-2010" target="_blank">https://doi.org/10.5194/acp-10-10399-2010</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>38</label><mixed-citation>
      
Li, J., Liu, L., Lacis, A. A., and Carlson, B. E.: An optimal fitting approach to improve the GISS ModelE aerosol optical property parameterization using AERONET data, J. Geophys. Res., 115, D16211, <a href="https://doi.org/10.1029/2010JD013909" target="_blank">https://doi.org/10.1029/2010JD013909</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>39</label><mixed-citation>
      
Li, J., Carlson, B. E., and Yung, Y. L.: Scattering and absorbing aerosols in the climate system, Natl. Rev. Earth Environ., 3, 363–379,
<a href="https://doi.org/10.1038/s43017-022-00296-7" target="_blank">https://doi.org/10.1038/s43017-022-00296-7</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>40</label><mixed-citation>
      
Li, Z., Zhang, Y., Xu, H., Li, K., Dubovik, O., and Goloub, P.: The Fundamental Aerosol Models Over China Region: A Cluster Analysis of the
Ground-Based Remote Sensing Measurements of Total Columnar Atmosphere, Geophys. Res. Lett., 46, 4924–4932, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>41</label><mixed-citation>
      
Martins, J. V., Artaxo, P., Kaufman, Y. J., Castanho, A. D., and Remer, L. A.: Spectral absorption properties of aerosol particles from 350–2500&thinsp;nm,
Geophys. Res. Lett., 36, L13810, <a href="https://doi.org/10.1029/2009GL037435" target="_blank">https://doi.org/10.1029/2009GL037435</a>, 2009.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>42</label><mixed-citation>
      
Moise, T., Flores, J. M., and Rudich, Y.: Optical properties of secondary
organic aerosols and their changes by chemical processes, Chem. Rev., 115,
4400–4439, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>43</label><mixed-citation>
      
Omar, A. H., Won, J.-G., Winker, D. M., Yoon, S.-C., Dubovik, O., and McCormick, M. P.: Development of global aerosol models using cluster analysis of Aerosol Robotic Network (AERONET) measurements, J. Geophys. Res., 110, D10S14, <a href="https://doi.org/10.1029/2004JD004874" target="_blank">https://doi.org/10.1029/2004JD004874</a>, 2005.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>44</label><mixed-citation>
      
Osborne, M., Malavelle, F. F., Adam, M., Buxmann, J., Sugier, J., Marenco,
F., and Haywood, J.: Saharan dust and biomass burning aerosols during ex-hurricane Ophelia: observations from the new UK lidar and sun-photometer
network, Atmos. Chem. Phys., 19, 3557–3578, <a href="https://doi.org/10.5194/acp-19-3557-2019" target="_blank">https://doi.org/10.5194/acp-19-3557-2019</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>45</label><mixed-citation>
      
Pokhrel, R. P., Beamesderfer, E. R., Wagner, N. L., Langridge, J. M., Lack, D. A., Jayarathne, T., Stone, E. A., Stockwell, C. E., Yokelson, R. J., and Murphy, S. M.: Relative importance of black carbon, brown carbon, and absorption enhancement from clear coatings in biomass burning emissions, Atmos. Chem. Phys., 17, 5063–5078, <a href="https://doi.org/10.5194/acp-17-5063-2017" target="_blank">https://doi.org/10.5194/acp-17-5063-2017</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>46</label><mixed-citation>
      
Proske, U., Ferrachat, S., and Lohmann, U.: Developing a climatological
simplification of aerosols to enter the cloud microphysics of a global climate model, Atmos. Chem. Phys., 24, 5907–5933, <a href="https://doi.org/10.5194/acp-24-5907-2024" target="_blank">https://doi.org/10.5194/acp-24-5907-2024</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>47</label><mixed-citation>
      
Reid, J. S. and Hobbs, P. V.: Physical and optical properties of young smoke from individual biomass fires in Brazil, J. Geophys. Res., 103, 32013–32030, 1998.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>48</label><mixed-citation>
      
Reid, J. S., Eck, T. F., Christopher, S. A., Koppmann, R., Dubovik, O.,
Eleuterio, D. P., Holben, B. N., Reid, E. A., and Zhang, J.: A review of biomass burning emissions part III: intensive optical properties of biomass
burning particles, Atmos. Chem. Phys., 5, 827–849, <a href="https://doi.org/10.5194/acp-5-827-2005" target="_blank">https://doi.org/10.5194/acp-5-827-2005</a>, 2005.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>49</label><mixed-citation>
      
Rodríguez, S. and López-Darias, J.: Extreme Saharan dust events expand northward over the Atlantic and Europe, prompting record-breaking
PM<sub>10</sub> and PM<sub>2.5</sub> episodes, Atmos. Chem. Phys., 24, 12031–12053,
<a href="https://doi.org/10.5194/acp-24-12031-2024" target="_blank">https://doi.org/10.5194/acp-24-12031-2024</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>50</label><mixed-citation>
      
Rosario, N. E.: Machine learning-driven characterization and prescription of
aerosol optical properties for atmospheric models, Zenodo [code an data set], <a href="https://doi.org/10.5281/zenodo.14825197" target="_blank">https://doi.org/10.5281/zenodo.14825197</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>51</label><mixed-citation>
      
Rosário, N. E., Longo, K. M., Freitas, S. R., Yamasoe, M. A., and Fonseca, R. M.: Modeling the South American regional smoke plume: aerosol
optical depth variability and surface shortwave flux perturbation, Atmos.
Chem. Phys., 13, 2923–2938, <a href="https://doi.org/10.5194/acp-13-2923-2013" target="_blank">https://doi.org/10.5194/acp-13-2923-2013</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>52</label><mixed-citation>
      
Russell, P. B., Kacenelenbogen, M., Livingston, J. M., Hasekamp, O. P.,
Burton, S. P., Schuster, G. L., Johnson, M. S., Knobelspiesse, K. D., Redemann, J., Ramachandran, S., and Holben, B.: A multiparameter aerosol
classification method and its application to retrievals from spaceborne
polarimetry, J. Geophys. Res.-Atmos., 119, 9838–9863,
<a href="https://doi.org/10.1002/2013JD021411" target="_blank">https://doi.org/10.1002/2013JD021411</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>53</label><mixed-citation>
      
Saleh, R., Robinson, E. S., Tkacik, D. S., Ahern, A. T., Liu, S., Aiken, A.
C., Sullivan, R. C., Presto, A. A., Dubey, M. K., Yokelson, R. J., Donahue, N. M., and Robinson, A. L.: Brownness of organics in aerosols from biomass
burning linked to their black carbon content, Nat. Geosci., 7, 647–650,
<a href="https://doi.org/10.1038/ngeo2220" target="_blank">https://doi.org/10.1038/ngeo2220</a>, 2014.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>54</label><mixed-citation>
      
Samset, B. H., Stjern, C. W., Andrews, E., Kahn, R. A., Myhre, G., Schulz, M., and Schuster, G. L.: Aerosol Absorption: Progress Towards Global and
Regional Constraints, Curr. Clim. Change Rep., 4, 65–83,
<a href="https://doi.org/10.1007/s40641-018-0091-4" target="_blank">https://doi.org/10.1007/s40641-018-0091-4</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>55</label><mixed-citation>
      
Sand, M., Samset, B. H., Myhre, G., Gliß, J., Bauer, S. E., Bian, H.,
Chin, M., Checa-Garcia, R., Ginoux, P., Kipling, Z., Kirkevåg, A., Kokkola, H., Le Sager, P., Lund, M. T., Matsui, H., van Noije, T., Olivié, D. J. L., Remy, S., Schulz, M., Stier, P., Stjern, C. W., Takemura, T., Tsigaridis, K., Tsyro, S. G., and Watson-Parris, D.: Aerosol
absorption in global models from AeroCom phase III, Atmos. Chem. Phys., 21,
15929–15947, <a href="https://doi.org/10.5194/acp-21-15929-2021" target="_blank">https://doi.org/10.5194/acp-21-15929-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>56</label><mixed-citation>
      
Schwink, S. K., Mael, L. E., Dunnington, T. H., Schmid, M. J., Silberstein,
J. M., Heck, A., Gotlib, N., Hannigan, M. P., and Vance, M. E.: Impacts of
Aging and Relative Humidity on Properties of Biomass Burning Smoke Particles, ACS EST Air, 2, 109–118, <a href="https://doi.org/10.1021/acsestair.4c00224" target="_blank">https://doi.org/10.1021/acsestair.4c00224</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>57</label><mixed-citation>
      
Shettle, E. P. and Fenn, R. W.: Models for the aerosols of the lower atmosphere and the effects of humidity variations on their optical properties, Environmental Research Papers No. 676, AFGL-TR-79-0214, Optical Physics Division, Air Force Geophysics Laboratory, Hanscom AFB, MA, USA, 94&thinsp;pp., <a href="https://books.google.com/books?id=JSlkjReviS4C" target="_blank"/> (last access: 1 April 2026), 1979.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>58</label><mixed-citation>
      
Shi, C., Wei, B., and Wei, S.: A quantitative discriminant method of elbow
point for the optimal number of clusters in clustering algorithm, J. Wireless Commun. Network, 2021, 31, <a href="https://doi.org/10.1186/s13638-021-01910-w" target="_blank">https://doi.org/10.1186/s13638-021-01910-w</a>, 2021.


    </mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>59</label><mixed-citation>
      
Shin, S. K., Tesche, M., Kim, K., Kezoudi, M., Tatarov, B., Müller, D.,
and Noh, Y.: On the spectral depolarisation and lidar ratio of mineral dust
provided in the AERONET version 3 inversion product, Atmos. Chem. Phys., 18,
12735–12746, <a href="https://doi.org/10.5194/acp-18-12735-2018" target="_blank">https://doi.org/10.5194/acp-18-12735-2018</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>60</label><mixed-citation>
      
Silva, P., Carmo, M., Rio, J., and Novo, I.: Changes in the Seasonality of
Fire Activity and Fire Weather in Portugal: Is the Wildfire Season Really
Longer?, Meteorology, 2, 74–86, <a href="https://doi.org/10.3390/meteorology2010006" target="_blank">https://doi.org/10.3390/meteorology2010006</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>61</label><mixed-citation>
      
Sinyuk, A., Holben, B. N., Eck, T. F., Giles, D. M., Slutsker, I., Korkin, S., Schafer, J. S., Smirnov, A., Sorokin, M., and Lyapustin, A.: The AERONET
Version 3 aerosol retrieval algorithm, associated uncertainties and
comparisons to Version 2, Atmos. Meas. Tech., 13, 3375–3411,
<a href="https://doi.org/10.5194/amt-13-3375-2020" target="_blank">https://doi.org/10.5194/amt-13-3375-2020</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>62</label><mixed-citation>
      
Smirnov, A., Holben, B. N., Kaufman, Y. J., Dubovik, O., Eck, T. F., Slutsker, I., Pietras, C., and Halthore, R. N.: Optical Properties of Atmospheric Aerosol in Maritime Environments, J. Atmos. Sci., 59, 501–523,
<a href="https://doi.org/10.1175/1520-0469(2002)059&lt;0501:OPOAAI&gt;2.0.CO;2" target="_blank">https://doi.org/10.1175/1520-0469(2002)059&lt;0501:OPOAAI&gt;2.0.CO;2</a>, 2002.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>63</label><mixed-citation>
      
Spencer, R. S., Levy, R. C., Remer, L. A., Mattoo, S., Arnold, G. T., Hlavka, D. L., Meyer, K. G., Marshak, A., Wilcox, E. M., and Platnick, S. E.: Exploring Aerosols near Clouds with High-Spatial-Resolution Aircraft Remote Sensing during SEAC(4)RS, J. Geophys. Res.-Atmos., 124, 2148–2173, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>64</label><mixed-citation>
      
Toledano, C., Cachorro, V. E., de Frutos, A. M., Sorribas, M., and Prats, N.: Inventory of African Desert Dust Events Over the Southwestern Iberian Peninsula in 2000–2005 with an AERONET Cimel Sun Photometer, J. Geophys. Res., 112, D21201, <a href="https://doi.org/10.1029/2006JD008307" target="_blank">https://doi.org/10.1029/2006JD008307</a>, 2007.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib65"><label>65</label><mixed-citation>
      
Zhao, A., Ryder, C. L., and Wilcox, L. J.: How well do the CMIP6 models simulate dust aerosols?, Atmos. Chem. Phys., 22, 2095–2119, <a href="https://doi.org/10.5194/acp-22-2095-2022" target="_blank">https://doi.org/10.5194/acp-22-2095-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib66"><label>66</label><mixed-citation>
      
Zhao, G., Tan, T., Zhao, W., Guo, S., Tian, P., and Zhao, C.: A new parameterization scheme for the real part of the ambient urban aerosol
refractive index, Atmos. Chem. Phys., 19, 12875–12885,
<a href="https://doi.org/10.5194/acp-19-12875-2019" target="_blank">https://doi.org/10.5194/acp-19-12875-2019</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib67"><label>67</label><mixed-citation>
      
Zhong, Q., Schutgens, N., van der Werf, G. R., van Noije, T., Bauer, S. E.,
Tsigaridis, K., Mielonen, T., Checa-Garcia, R., Neubauer, D., Kipling, Z.,
Kirkevåg, A., Olivié, D. J. L., Kokkola, H., Matsui, H., Ginoux, P.,
Takemura, T., Le Sager, P., Rémy, S., Bian, H., and Chin, M.: Using
modelled relationships and satellite observations to attribute modelled
aerosol biases over biomass burning regions, Nat. Commun., 13, 5914,
<a href="https://doi.org/10.1038/s41467-022-33680-4" target="_blank">https://doi.org/10.1038/s41467-022-33680-4</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib68"><label>68</label><mixed-citation>
      
Zhou, P., Wang, Y., Liu, J., Xu, L., Chen, X., and Zhang, L.: Difference
between global and regional aerosol model classifications and associated
implications for spaceborne aerosol optical depth retrieval, Atmos. Environ., 300, 119674, <a href="https://doi.org/10.1016/j.atmosenv.2023.119674" target="_blank">https://doi.org/10.1016/j.atmosenv.2023.119674</a>, 2023.

    </mixed-citation></ref-html>--></article>
