<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="3.0" xml:lang="en" article-type="research article">
 <front>
  <journal-meta>
   <journal-id journal-id-type="publisher-id">
    ojap
   </journal-id>
   <journal-title-group>
    <journal-title>
     Open Journal of Air Pollution
    </journal-title>
   </journal-title-group>
   <issn pub-type="epub">
    2169-2653
   </issn>
   <issn publication-format="print">
    2169-2661
   </issn>
   <publisher>
    <publisher-name>
     Scientific Research Publishing
    </publisher-name>
   </publisher>
  </journal-meta>
  <article-meta>
   <article-id pub-id-type="doi">
    10.4236/ojap.2025.144006
   </article-id>
   <article-id pub-id-type="publisher-id">
    ojap-146987
   </article-id>
   <article-categories>
    <subj-group subj-group-type="heading">
     <subject>
      Articles
     </subject>
    </subj-group>
    <subj-group subj-group-type="Discipline-v2">
     <subject>
      Earth 
     </subject>
     <subject>
       Environmental Sciences
     </subject>
    </subj-group>
   </article-categories>
   <title-group>
    Using Machine Learning Models to Predict Daily PM
    <sub>10</sub> Concentration in the Wet Savanna of Lamto Station in Côte d’Ivoire
   </title-group>
   <contrib-group>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Touré E.
      </surname>
      <given-names>
       N’Datchoh
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Money
      </surname>
      <given-names>
       Ossohou
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref> 
     <xref ref-type="aff" rid="aff2"> 
      <sup>2</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Adama
      </surname>
      <given-names>
       Bamba
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Yoman C. E.
      </surname>
      <given-names>
       Etien
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff2"> 
      <sup>2</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Kouakou
      </surname>
      <given-names>
       Kouadio
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref> 
     <xref ref-type="aff" rid="aff3"> 
      <sup>3</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Fidèle
      </surname>
      <given-names>
       Yoroba
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref> 
     <xref ref-type="aff" rid="aff3"> 
      <sup>3</sup>
     </xref> 
     <xref ref-type="aff" rid="aff4"> 
      <sup>4</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Madina
      </surname>
      <given-names>
       Doumbia
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref> 
     <xref ref-type="aff" rid="aff5"> 
      <sup>5</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Mohamed L.
      </surname>
      <given-names>
       Kassamba-Diaby
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref> 
     <xref ref-type="aff" rid="aff6"> 
      <sup>6</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Sylvain
      </surname>
      <given-names>
       Gnamien
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref>
    </contrib>
    <contrib contrib-type="author" xlink:type="simple">
     <name name-style="western">
      <surname>
       Véronique
      </surname>
      <given-names>
       Yoboué
      </given-names>
     </name> 
     <xref ref-type="aff" rid="aff1"> 
      <sup>1</sup>
     </xref> 
     <xref ref-type="aff" rid="aff6"> 
      <sup>6</sup>
     </xref>
    </contrib>
   </contrib-group> 
   <aff id="aff1">
    <addr-line>
     aUFR SSMT, LASMES, University Félix Houphouët-Boigny, Abidjan, Côte d’Ivoire
    </addr-line> 
   </aff> 
   <aff id="aff2">
    <addr-line>
     aDepartment of Physics, University of Man, Man, Côte d’Ivoire
    </addr-line> 
   </aff> 
   <aff id="aff3">
    <addr-line>
     aStation Geophysic of Lamto, N’Douci, Côte d’Ivoire
    </addr-line> 
   </aff> 
   <aff id="aff4">
    <addr-line>
     aUFR Sciences of Technology, Department of Physics, University Alassane Ouattara of Bouaké, Bouaké, Côte d’Ivoire
    </addr-line> 
   </aff> 
   <aff id="aff5">
    <addr-line>
     aUniversity Peleforo Gon Coulibaly, Korhogo, Côte d’Ivoire
    </addr-line> 
   </aff> 
   <aff id="aff6">
    <addr-line>
     aUniversity Nangui Abrogoua, Abidjan, Côte d’Ivoire
    </addr-line> 
   </aff> 
   <pub-date pub-type="epub">
    <day>
     05
    </day> 
    <month>
     11
    </month>
    <year>
     2025
    </year>
   </pub-date> 
   <volume>
    14
   </volume> 
   <issue>
    04
   </issue>
   <fpage>
    73
   </fpage>
   <lpage>
    100
   </lpage>
   <history>
    <date date-type="received">
     <day>
      31,
     </day>
     <month>
      August
     </month>
     <year>
      2025
     </year>
    </date>
    <date date-type="published">
     <day>
      2,
     </day>
     <month>
      August
     </month>
     <year>
      2025
     </year> 
    </date> 
    <date date-type="accepted">
     <day>
      2,
     </day>
     <month>
      November
     </month>
     <year>
      2025
     </year> 
    </date>
   </history>
   <permissions>
    <copyright-statement>
     © Copyright 2014 by authors and Scientific Research Publishing Inc. 
    </copyright-statement>
    <copyright-year>
     2014
    </copyright-year>
    <license>
     <license-p>
      This work is licensed under the Creative Commons Attribution International License (CC BY). http://creativecommons.org/licenses/by/4.0/
     </license-p>
    </license>
   </permissions>
   <abstract>
    Despite its significant impacts on climate, environment, and public health, air pollution monitoring in Africa is still sparse. This study developed a machine learning framework of four models—namely SARIMAX, Random Forest, XGBoost, and LightGBM—that were trained on a daily basis using 25 meteorological variables from ERA5 reanalysis to reproduce daily PM
    <sub>10</sub> surface concentrations in Lamto, Côte d’Ivoire. A total of 2225 daily recorded concentrations from 2017 to 2023 were used, with 80% (1780 days) allocated to training the models and 20% (445 days) for prediction. An assessment of ERA5 reanalysis data against in-situ measurements highlighted its ability to reproduce the pattern of meteorological variables such as temperature and relative humidity, despite some biases. Results show that all models were able to reproduce the observed PM
    <sub>10</sub> variations, although they slightly overestimated concentrations during the main wet season (March-April-May-June-July) and underestimated high pollution events in the main dry season (November-December-January-February). Finally, performance analysis revealed that the Random Forest model outperformed, with an R
    <sup>2</sup> of 0.78 and RMSE of 23 µg/m
    <sup>3</sup>, outperforming the other models. This framework successfully demonstrates the utility of machine learning for air quality prediction in West Africa, with potential for future improvements through bias correction and model combination.
   </abstract>
   <kwd-group> 
    <kwd>
     Lamto
    </kwd> 
    <kwd>
      Prediction
    </kwd> 
    <kwd>
      PM
     <sub>10</sub>
    </kwd> 
    <kwd>
      Machine Learning
    </kwd> 
    <kwd>
      Air Pollution
    </kwd> 
    <kwd>
      Performance
    </kwd>
   </kwd-group>
  </article-meta>
 </front>
 <body>
  <sec id="s1">
   <title>1. Introduction</title>
   <p>Human beings, through their activities, have strongly impacted and shaped their environment, including the Earth’s atmospheric composition. Since the Industrial Revolution in the 18<sup>th</sup> century, numerous compounds have been released into the atmosphere. These atmospheric compounds are responsible for current global warming, which induces climate change <xref ref-type="bibr" rid="scirp.146987-1">
     [1]
    </xref> <xref ref-type="bibr" rid="scirp.146987-2">
     [2]
    </xref>. They contain aerosols, defined as particulate matter in a solid or liquid state suspended in the atmosphere. These aerosols are reported to play a significant role in the climate through their direct, indirect, and semi-direct effects <xref ref-type="bibr" rid="scirp.146987-3">
     [3]
    </xref> <xref ref-type="bibr" rid="scirp.146987-4">
     [4]
    </xref>. Their size distribution in the total suspended particles is often classified into three (3) modes: coarse (PM<sub>10</sub>), fine (PM<sub>2.5</sub>), and ultra-fine (PM<sub>1</sub>) particles. Their lifetime in the atmosphere is strongly dependent on their mode <xref ref-type="bibr" rid="scirp.146987-5">
     [5]
    </xref> and generally ranges from a few hours to several weeks. The coarse mode particles tend to be deposited close to their sources, while fine and ultra-fine particles, which contribute to particulate matter (PM), have a longer lifetime and can undergo long-range transport. These particles contribute to air quality deterioration and have numerous impacts on climate, ecosystems, and human health <xref ref-type="bibr" rid="scirp.146987-6">
     [6]
    </xref>-<xref ref-type="bibr" rid="scirp.146987-8">
     [8]
    </xref>.</p>
   <p>Air quality and its impacts in West Africa have drawn attention in several works, revealing increasing air pollution affecting population health <xref ref-type="bibr" rid="scirp.146987-9">
     [9]
    </xref> <xref ref-type="bibr" rid="scirp.146987-10">
     [10]
    </xref>. In urban areas, they are often investigated using ground-based observations <xref ref-type="bibr" rid="scirp.146987-11">
     [11]
    </xref>-<xref ref-type="bibr" rid="scirp.146987-15">
     [15]
    </xref>, satellite <xref ref-type="bibr" rid="scirp.146987-16">
     [16]
    </xref>, and modeling <xref ref-type="bibr" rid="scirp.146987-17">
     [17]
    </xref> <xref ref-type="bibr" rid="scirp.146987-18">
     [18]
    </xref>. During the Dynamics-Aerosol-Chemistry-Cloud Interactions in West Africa (DACCIWA) project, numerous studies have highlighted that anthropogenic pollutants emitted from the coastal region of the Guinean Coast were transported to remote areas <xref ref-type="bibr" rid="scirp.146987-19">
     [19]
    </xref> <xref ref-type="bibr" rid="scirp.146987-20">
     [20]
    </xref>. As urban areas’ air quality received considerable attention, only a few studies have focused on air quality in rural areas. Investigating daily Aerosol Optical Depth (AOD) in 11 stations across various biomes of Southwest Africa, Niamien <xref ref-type="bibr" rid="scirp.146987-21">
     [21]
    </xref> found that their AOD ranged from 0.35 in the Sahel area to 0.49 in the Guinea Coast area, and a maximum of 0.53 was observed in the savanna area. Moreover, the International Network to study Deposition and Atmospheric Chemistry in Africa (INDAAF, <xref ref-type="bibr" rid="scirp.146987-https://indaaf.obs-mip.fr">
     https://indaaf.obs-mip.fr
    </xref>), has allowed researchers to focus attention on the atmospheric chemical composition of various biomes and rural areas in Africa <xref ref-type="bibr" rid="scirp.146987-22">
     [22]
    </xref>-<xref ref-type="bibr" rid="scirp.146987-25">
     [25]
    </xref>. For example, Lamto atmospheric composition was reported to be influenced by emissions from both local and regional sources, particularly from mesoscale sources with a strong anthropogenic signature <xref ref-type="bibr" rid="scirp.146987-26">
     [26]
    </xref>.</p>
   <p>Another important aspect of air quality degradation is its strong impact on the environment and human health. According to the World Health Organization (WHO), air pollution is responsible for more than 7 million premature deaths every year, particularly affecting urban and peri-urban areas in developing countries <xref ref-type="bibr" rid="scirp.146987-27">
     [27]
    </xref>. In Africa, a report on the current situation of air quality highlighted an increase in air pollution across the continent, which was responsible for 250,000 premature deaths in 2018 <xref ref-type="bibr" rid="scirp.146987-28">
     [28]
    </xref>. Among these air pollutants, aerosols, particularly PM<sub>10</sub>, are recognized as some of the most harmful components for both human health and ecosystems. For instance, PM<sub>10</sub> is linked to respiratory and cardiovascular diseases and contributes to climate imbalance <xref ref-type="bibr" rid="scirp.146987-29">
     [29]
    </xref>. Moreover, prolonged exposure to high concentrations of PM<sub>10</sub> has been associated with increased hospital admissions for respiratory conditions such as asthma, obstructive lung disease, and pulmonary infections. A connection between peaks in PM<sub>10</sub> levels and deaths induced by cardiovascular disease has been indicated through strong correlations, highlighting an increase in myocardial infarction, stroke, and hypertension <xref ref-type="bibr" rid="scirp.146987-30">
     [30]
    </xref>. Despite their hazardous nature, monitoring of these particles remains limited, especially in West Africa, where the high cost of referenced instruments and the scarce infrastructure obstruct continuous monitoring. This lack of data compromises the implementation of effective public policies for air quality management. However, certain scientific initiatives, such as the INDAAF program, have enabled the regular and long-term collection of atmospheric chemistry data from multiple sites in Africa <xref ref-type="bibr" rid="scirp.146987-22">
     [22]
    </xref>-<xref ref-type="bibr" rid="scirp.146987-25">
     [25]
    </xref>. Over Lamto, an INDAAF supersite located in the center of Côte d’Ivoire, the atmospheric chemistry composition is monitored. The composition of the atmosphere at this station is the result of complex interactions between natural and anthropogenic sources in a rural area <xref ref-type="bibr" rid="scirp.146987-26">
     [26]
    </xref>. This makes Lamto an ideal site for studying how particulate compounds interact with meteorological conditions. However, spatiotemporal coverage remains too limited for full operational monitoring of this area. In response to these structural limitations, the integration of new technological approaches is emerging as a promising alternative. Among them, Artificial Intelligence (AI), and more specifically Machine Learning (ML) methods, offer powerful tools to compensate for the lack of data and improve predictive capabilities. The ML algorithms usually can analyze data from various sources, including air quality sensors, satellite imaging, and weather data, to provide real-time information on air quality <xref ref-type="bibr" rid="scirp.146987-31">
     [31]
    </xref>-<xref ref-type="bibr" rid="scirp.146987-33">
     [33]
    </xref>. Information about air pollution sources, pollution levels, and attenuation actions can be provided by these algorithms under the conditions they have been trained to recognize patterns and trends in the data <xref ref-type="bibr" rid="scirp.146987-32">
     [32]
    </xref>. However, all these algorithms do not perform similarly, and their choice may be highly dependent on the nature of pollutants and the purpose of the study. For example, in their health-related research, Dobrea <xref ref-type="bibr" rid="scirp.146987-34">
     [34]
    </xref> compared other AI-oriented techniques/models for air pollutants and suggested Support Vector Regression (SVR) and AutoRegressive Integrated Moving Average (ARIMA) as the best-performing techniques for time series analysis of PM<sub>10</sub> and PM<sub>2.5</sub>. Moreover, some works emphasized that hybrid models have better performance and present several advantages for environmental monitoring policy and decision-making <xref ref-type="bibr" rid="scirp.146987-35">
     [35]
    </xref> <xref ref-type="bibr" rid="scirp.146987-36">
     [36]
    </xref>. Therefore, by exploiting existing data, these techniques enable the anticipation of changes in pollutant levels such as PM<sub>10</sub>, thereby supporting environmental management efforts, even in low-resource settings. Their capacity to identify complex, non-linear relationships makes them particularly suitable for environments like Lamto, where multiple factors influence atmospheric processes. In this context, the present study aims to explore for the first time the potential of Artificial Intelligence (AI) models to reproduce and predict PM<sub>10</sub> concentrations at Lamto over seven years (2017-2023). To achieve this, four AI models were employed, and their performances were assessed.</p>
  </sec><sec id="s2">
   <title>2. Materials and Methods</title>
   <sec id="s2_1">
    <title>2.1. Sampling Site</title>
    <p>Lamto is a station located at 6˚13'N and 5˚2'W, approximately 120 km from Abidjan (Côte d’Ivoire), situated within the humid savanna (<xref ref-type="fig" rid="fig1">
      Figure 1
     </xref>). The Lamto reserve was established in 1962, covering about 2,617 ha, and has been the subject of numerous research studies <xref ref-type="bibr" rid="scirp.146987-37">
      [37]
     </xref>-<xref ref-type="bibr" rid="scirp.146987-42">
      [42]
     </xref>. The reserve contains various measurement observation sites for seismology, infrasound, climatology, Greenhouse Gas (CarboAfrica European project,<xref ref-type="bibr" rid="scirp.146987-http://www.carboafrica.eu/"></xref><xref ref-type="bibr" rid="scirp.146987-http://www.carboafrica.eu/">
      http://www.carboafrica.eu/
     </xref>), atmospheric mercury, atmospheric chemistry (INDAAF), and ecology. The reserve is often burned around mid-January to remove epigenetic phytomass and conduct ecological experiments <xref ref-type="bibr" rid="scirp.146987-41">
      [41]
     </xref> <xref ref-type="bibr" rid="scirp.146987-42">
      [42]
     </xref>. The climate of the Lamto reserve is governed by the West African Monsoon (WAM) and the seasonal shift of the Intertropical Convergence Zone (ITCZ). The annual mean rainfall ranges between approximately 1240 and 1590 mm <xref ref-type="bibr" rid="scirp.146987-40">
      [40]
     </xref>, with four main seasons: a dry season (November to February), a wet season (March to July), a slightly dry season in August, due to monsoon jump, and a slightly wet season from September to November (monsoon retreat). Temperatures are relatively hot throughout the year, averaging around 27˚C, while</p>
    <fig id="fig1" position="float">
     <label>Figure 1</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 1. (a) Localization map of the Lamto-(Côte d’Ivoire) reserve (6˚31'N-5˚02'W). The green point indicates the Lamto location; numbers in red are the mean annual precipitation (1962-1997) of some synoptic stations, and from north to south, are located the types of vegetation <xref ref-type="bibr" rid="scirp.146987-43">
        [43]
       </xref>; and (b) zoom on the vegetation of Lamto <xref ref-type="bibr" rid="scirp.146987-44">
        [44]
       </xref>.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId16.jpeg?20251105021456" />
    </fig>
    <p>relative humidity varies between 65% (minimum in January during the main dry season) and 82% (maximum in June during the main and first rainy season).</p>
   </sec>
   <sec id="s2_2">
    <title>2.2. Data</title>
    <p>The PM<sub>10</sub> concentration data used in our study were retrieved using the TEOM (Tapered Element Oscillating Microbalance) 1400A, covering seven years from January 1, 2017 to December 31, 2023, at the Lamto station <xref ref-type="bibr" rid="scirp.146987-45">
      [45]
     </xref>. Lamto is one of the super sites of the INDAAF program (<xref ref-type="bibr" rid="scirp.146987-https://indaaf.obs-mip.fr/">
      https://indaaf.obs-mip.fr/
     </xref>). INDAAF is a National Observation Service (SNO) of the Institut National des Sciences de l’Univers (INSU) of the Centre National de Recherche Scientifique (CNRS) and is supported by Institut de Recherche pour le Développement (IRD). These PM<sub>10</sub> concentration data are available on the INDAAF program website at an hourly scale in micrograms per cubic meter (μg/m<sup>3</sup>). To reduce the number of missing values, we aggregated the PM<sub>10</sub> data to compute daily averages. This approach led to 16.43% missing values across the entire dataset.</p>
    <p>Hourly weather and climate parameter data were extracted from the ERA5 database <xref ref-type="bibr" rid="scirp.146987-46">
      [46]
     </xref> at the grid point closest to the Lamto station. ERA5 is the fifth generation of reanalyses from the European Centre for Medium-Range Weather Forecasts (ECMWF). The data, available from 1940 to the present day, relate to climate and weather conditions on a global scale over the last eight decades. For the present work, 25 meteorological variables (<xref ref-type="table" rid="table1">
      Table 1
     </xref>) have been selected from January 1, 2017 to December 31, 2023. These variables were chosen because they are known to represent weather conditions and atmospheric dynamics. Indeed, these variables relate to wind, temperature, humidity, the planetary boundary layer, and precipitation, which are known to influence the dispersion, accumulation, and leaching of aerosols <xref ref-type="bibr" rid="scirp.146987-47">
      [47]
     </xref>-<xref ref-type="bibr" rid="scirp.146987-50">
      [50]
     </xref>.</p>
    <table-wrap id="table1">
     <label>
      <xref ref-type="table" rid="table1">
       Table 1
      </xref></label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Table 1. List of ERA5 meteorological variables used for the machine learning model training and prediction of PM<sub>10</sub> concentration.</title>
     </caption>
     <table class="MsoTableGrid custom-table" border="0" cellspacing="0" cellpadding="0"> 
      <tr> 
       <td class="custom-bottom-td acenter" width="50.02%"><p style="text-align:center">Parameters</p></td> 
       <td class="custom-bottom-td acenter" width="49.98%"><p style="text-align:center">Description</p></td> 
      </tr> 
      <tr> 
       <td class="custom-top-td acenter" width="50.02%"><p style="text-align:center">Zonal wind at 100 m</p></td> 
       <td class="custom-top-td acenter" width="49.98%"><p style="text-align:center">East-west component of wind at 100 m</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Meridional wind at 100 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">North-south component of wind at 100 m</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Zonal wind at 10 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">East-west component of wind at 10 m</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Meridional wind at 10 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">North-south component of wind at 10 m</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Air temperature at 2 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Near-surface air temperature</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Dew point temperature at 2 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Temperature at which air becomes saturated</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Maximum daily air temperature at 2 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Daily maximum air temperature near the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Minimum daily air temperature at 2 m</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Daily minimum air temperature near the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Planetary boundary layer height</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Height of the atmospheric boundary layer</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Turbulent surface stress (east)</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Surface stress in the eastward direction</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Turbulent surface stress (north)</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Surface stress in the northward direction</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Frictional velocity</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Surface friction velocity</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Mean evaporation rate</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Average evaporation rate</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Mean sea level pressure</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Atmospheric pressure at sea level</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Surface pressure</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Atmospheric pressure at the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Mean solar radiation flux downward at the surface</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Incoming solar radiation at the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Net solar radiation flux at the surface</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Net radiation balance at the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Surface latent heat flux</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Latent heat exchange at the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Surface sensible heat flux</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Sensible heat exchange at the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Soil temperature-surface layer</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Soil temperature near the surface</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Soil volumetric water content (layer 1)</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Soil moisture content in the first layer</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Total column water (precipitation)</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Integrated water vapour column</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Total cloud cover</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Fraction of sky covered by clouds</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Total precipitation</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Precipitation amount</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.02%"><p style="text-align:center">Integrated vertical divergence of humidity</p></td> 
       <td class="acenter" width="49.98%"><p style="text-align:center">Vertical divergence of moisture flux</p></td> 
      </tr> 
     </table>
    </table-wrap>
   </sec>
   <sec id="s2_3">
    <title>2.3. Models, Training, and Evaluation</title>
    <p>To achieve the goals of this study, four machine learning models were used (<xref ref-type="table" rid="table2">
      Table 2
     </xref>). Their performances are based on their ability to process linear and non-linear relationships between variables, regression and classification, boosting skills, memory efficiency, etc.</p>
    <p>
     <xref ref-type="bibr" rid="scirp.146987-"></xref>Table 2. Brief description of the different models used in this study.</p>
    <table class="MsoTableGrid custom-table" border="0" cellspacing="0" cellpadding="0"> 
     <tr> 
      <td class="custom-bottom-td acenter" width="16.16%"><p style="text-align:center">Models</p></td> 
      <td class="custom-bottom-td acenter" width="30.82%"><p style="text-align:center">Description</p></td> 
      <td class="custom-bottom-td acenter" width="21.84%"><p style="text-align:center">Output/analyzed parameters</p></td> 
     </tr> 
     <tr> 
      <td class="custom-top-td acenter" width="16.16%"><p style="text-align:center">SARIMAX model</p></td> 
      <td class="custom-top-td acenter" width="30.82%"><p style="text-align:center">Linear relationship between the variable to be predicted and its past values (autocorrelation)</p></td> 
      <td class="custom-top-td acenter" width="21.84%"><p style="text-align:center">Temporal dynamics of PM<sub>10</sub></p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="16.16%"><p style="text-align:center">Random forest model</p></td> 
      <td class="acenter" width="30.82%"><p style="text-align:center">A multitude of decision trees <xref ref-type="bibr" rid="scirp.146987-51">
         [51]
        </xref></p><p style="text-align:center">Handling complex, noisy, and non-linear relationships</p><p style="text-align:center">Classification and regression tasks</p></td> 
      <td class="acenter" width="21.84%"><p style="text-align:center">Temporal dynamics of PM<sub>10</sub></p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="16.16%"><p style="text-align:center">XGBoost model</p></td> 
      <td class="acenter" width="30.82%"><p style="text-align:center">Boosting technique: chaining together several weak (shallow) decision trees to build a powerful model.</p></td> 
      <td class="acenter" width="21.84%"><p style="text-align:center">Temporal dynamics of PM<sub>10</sub></p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="16.16%"><p style="text-align:center">LightGBM model</p></td> 
      <td class="acenter" width="30.82%"><p style="text-align:center">Optimized for speed and memory efficiency, enforced particularly by its training strategy based on leaf-wise growth rather than level-wise growth.</p></td> 
      <td class="acenter" width="21.84%"><p style="text-align:center">Temporal dynamics of PM<sub>10</sub></p></td> 
     </tr> 
    </table>
    <p>For this study, the data were split into two distinct parts. The first part, representing 80% of the total data length, constitutes a training set. This training set contains 80% of the oldest observations, i.e., starting from January 1, 2017. The second part of the data, representing the remaining 20% of the total data length, lies in the most recent period, i.e., closest to December 31, 2023. This split follows a strict temporal logic in which no random permutation of the data (shuffle) was carried out, which is essential in time series to preserve the coherence of the chronology of events. Respecting the order of the dates avoids any leakage of information from the future to the past at the learning stage, which would distort the model’s actual performance under prediction conditions. The choice of the 80/20 ratio is widely recognised as a good compromise between the quantity of data for training and the robustness of the evaluation <xref ref-type="bibr" rid="scirp.146987-52">
      [52]
     </xref>.</p>
    <p>Model training is a decisive stage in the modelling chain. The model training objective is to adjust the internal parameters of the algorithms so that they learn, from the training data, to predict the PM<sub>10</sub> concentration as a function of the meteorological variables selected. The rigor of this stage directly conditions the quality and robustness of future predictions, as well as the reliability of the assessment. In keeping with the temporal nature of the data, the models were trained solely on the training set (representing 80% of the data), with the remaining 20% being reserved for the test. No random resampling (shuffle) was carried out, in accordance with good practice in time series modelling <xref ref-type="bibr" rid="scirp.146987-53">
      [53]
     </xref>, in order to preserve the chronological order essential for model consistency.</p>
    <p>When modelling time series, it is essential to assess the robustness of the models while respecting the temporal structure of the data. Unlike the classic cross-validation method, which assumes the independence of observations and uses random partitions, time series require a specific approach to avoid the biases linked to time dependency. To meet this requirement, the cross-validation method adapted to time series was used, as described by scikit-learn in its official documentation. This method, called TimeSeriesSplit, divides the data into several segments while preserving the chronological order. Each successive segment uses a larger portion of the training data, followed by a test set that is immediately later in time. The use of TimeSeriesSplit provides a more realistic assessment of model performance on unseen data, while avoiding the data leakage problems that could arise with inappropriate cross-validation methods for time series.</p>
    <p>The exploratory analysis shows that the year 2023 has 58.63% missing data. Aware of this irregularity, we chose to restrict the study period to the time segment running from 14 January 2017 to 16 February 2023, a period during which data coverage is much more satisfactory. This delimitation made it possible to significantly reduce the overall rate of missing values to 8.99%, a proportion generally considered acceptable for modern imputation methods <xref ref-type="bibr" rid="scirp.146987-54">
      [54]
     </xref>.</p>
    <p>Performance evaluation is a crucial stage in the predictive modelling process, as it enables us to judge the accuracy, robustness, and practical usefulness of the model. Three metrics commonly adopted in time series prediction work were used, namely, the mean absolute error (MAE), the root mean square error (RMSE), and the coefficient of determination (R<sup>2</sup>).</p>
    <p>MAE (Equation (1)) measures the average absolute deviation between the predicted and observed values. It is simple to interpret and not very sensitive to outliers, but it does not consider the dispersion of errors.</p>
    <p>
     <math xmlns="http://www.w3.org/1998/Math/MathML"> <mrow> 
       <mi>
         M 
       </mi> 
       <mi>
         A 
       </mi> 
       <mi>
         E 
       </mi> 
       <mo>
         = 
       </mo> 
       <mfrac> 
        <mn>
          1 
        </mn> 
        <mi>
          n 
        </mi> 
       </mfrac> 
       <munderover> 
        <mstyle mathsize="140%" displaystyle="true"> 
         <mo>
           ∑ 
         </mo> 
        </mstyle> 
        <mrow> 
         <mi>
           i 
         </mi> 
         <mo>
           = 
         </mo> 
         <mn>
           1 
         </mn> 
        </mrow> 
        <mi>
          n 
        </mi> 
       </munderover> 
       <mrow> 
        <mo>
          | 
        </mo> 
        <mrow> 
         <msub> 
          <mi>
            y 
          </mi> 
          <mi>
            i 
          </mi> 
         </msub> 
         <mo>
           − 
         </mo> 
         <msub> 
          <mover accent="true"> 
           <mi>
             y 
           </mi> 
           <mo>
             ^ 
           </mo> 
          </mover> 
          <mi>
            i 
          </mi> 
         </msub> 
        </mrow> 
        <mo>
          | 
        </mo> 
       </mrow> 
      </mrow> 
     </math> (1)</p>
    <p>where:</p>
    <p>RMSE is the square root of the average of the squared deviations between the actual and predicted values. It is shown in Equation (2):</p>
    <p>
     <math xmlns="http://www.w3.org/1998/Math/MathML"> <mrow> 
       <mi>
         R 
       </mi> 
       <mi>
         M 
       </mi> 
       <mi>
         S 
       </mi> 
       <mi>
         E 
       </mi> 
       <mo>
         = 
       </mo> 
       <msqrt> 
        <mrow> 
         <mfrac> 
          <mn>
            1 
          </mn> 
          <mi>
            n 
          </mi> 
         </mfrac> 
         <munderover> 
          <mstyle mathsize="140%" displaystyle="true"> 
           <mo>
             ∑ 
           </mo> 
          </mstyle> 
          <mrow> 
           <mi>
             i 
           </mi> 
           <mo>
             = 
           </mo> 
           <mn>
             1 
           </mn> 
          </mrow> 
          <mi>
            n 
          </mi> 
         </munderover> 
         <msup> 
          <mrow> 
           <mrow> 
            <mo>
              ( 
            </mo> 
            <mrow> 
             <msub> 
              <mi>
                y 
              </mi> 
              <mi>
                i 
              </mi> 
             </msub> 
             <mo>
               − 
             </mo> 
             <msub> 
              <mover accent="true"> 
               <mi>
                 y 
               </mi> 
               <mo>
                 ^ 
               </mo> 
              </mover> 
              <mi>
                i 
              </mi> 
             </msub> 
            </mrow> 
            <mo>
              ) 
            </mo> 
           </mrow> 
          </mrow> 
          <mn>
            2 
          </mn> 
         </msup> 
        </mrow> 
       </msqrt> 
      </mrow> 
     </math> (2)</p>
    <p>This metric gives greater weight to large errors. It is, therefore, particularly useful for detecting models that fail to correctly predict peaks in pollution, a critical aspect of air quality.</p>
    <p>Coefficient of determination (R<sup>2</sup>)</p>
    <p>The coefficient of determination, R<sup>2</sup> given in Equation (3), measures the proportion of the variance in the observed data that the model explains.</p>
    <p>
     <math xmlns="http://www.w3.org/1998/Math/MathML"> <mrow> 
       <msup> 
        <mi>
          R 
        </mi> 
        <mn>
          2 
        </mn> 
       </msup> 
       <mo>
         = 
       </mo> 
       <mn>
         1 
       </mn> 
       <mo>
         − 
       </mo> 
       <mfrac> 
        <mrow> 
         <msubsup> 
          <mstyle mathsize="140%" displaystyle="true"> 
           <mo>
             ∑ 
           </mo> 
          </mstyle> 
          <mrow> 
           <mi>
             i 
           </mi> 
           <mo>
             = 
           </mo> 
           <mn>
             1 
           </mn> 
          </mrow> 
          <mi>
            n 
          </mi> 
         </msubsup> 
         <msup> 
          <mrow> 
           <mrow> 
            <mo>
              ( 
            </mo> 
            <mrow> 
             <msub> 
              <mi>
                y 
              </mi> 
              <mi>
                i 
              </mi> 
             </msub> 
             <mo>
               − 
             </mo> 
             <msub> 
              <mover accent="true"> 
               <mi>
                 y 
               </mi> 
               <mo>
                 ^ 
               </mo> 
              </mover> 
              <mi>
                i 
              </mi> 
             </msub> 
            </mrow> 
            <mo>
              ) 
            </mo> 
           </mrow> 
          </mrow> 
          <mn>
            2 
          </mn> 
         </msup> 
        </mrow> 
        <mrow> 
         <msubsup> 
          <mstyle mathsize="140%" displaystyle="true"> 
           <mo>
             ∑ 
           </mo> 
          </mstyle> 
          <mrow> 
           <mi>
             i 
           </mi> 
           <mo>
             = 
           </mo> 
           <mn>
             1 
           </mn> 
          </mrow> 
          <mi>
            n 
          </mi> 
         </msubsup> 
         <msup> 
          <mrow> 
           <mrow> 
            <mo>
              ( 
            </mo> 
            <mrow> 
             <msub> 
              <mi>
                y 
              </mi> 
              <mi>
                i 
              </mi> 
             </msub> 
             <mo>
               − 
             </mo> 
             <mover accent="true"> 
              <mi>
                y 
              </mi> 
              <mo>
                ¯ 
              </mo> 
             </mover> 
            </mrow> 
            <mo>
              ) 
            </mo> 
           </mrow> 
          </mrow> 
          <mn>
            2 
          </mn> 
         </msup> 
        </mrow> 
       </mfrac> 
      </mrow> 
     </math> (3)</p>
    <p>
     <xref ref-type="bibr" rid="scirp.146987-"></xref>where 
     <math xmlns="http://www.w3.org/1998/Math/MathML"> <mover accent="true"> 
       <mi>
         y 
       </mi> 
       <mo>
         ¯ 
       </mo> 
      </mover> 
     </math> is the mean of the actual values. An R<sup>2</sup> value close to 1 indicates that the model explains the variability of PM<sub>10</sub> concentrations well, while a negative value means that the model performs worse than a simple average.</p>
   </sec>
  </sec><sec id="s3">
   <title>3. Results and Discussion</title>
   <sec id="s3_1">
    <title>3.1. Assessment of ERA5 Data over Lamto</title>
    <p>Time series of daily air temperature at 2 m (<xref ref-type="fig" rid="fig2(a)">
      Figure 2(a)
     </xref>), daily minimum (<xref ref-type="fig" rid="fig2(b)">
      Figure 2(b)
     </xref>) and maximum (<xref ref-type="fig" rid="fig2(c)">
      Figure 2(c)
     </xref>) temperature, as well as relative humidity at the synoptic hours 06:00 UTC (<xref ref-type="fig" rid="fig2(d)">
      Figure 2(d)
     </xref>), 12:00 UTC (<xref ref-type="fig" rid="fig2(e)">
      Figure 2(e)
     </xref>), and 18:00 UTC (<xref ref-type="fig" rid="fig2(f)">
      Figure 2(f)
     </xref>) from 14 January 2017 to 16 February 2023 for the ERA5 and in-situ are compared. Results show that the diurnal cycle of these selected variables is quite well reproduced in the ERA5 reanalysis. However, ERA5 is underestimating the 2 m daily air temperature as well as the daily maximum temperature. The air temperature at 2 m fluctuates between 21.3˚C and 27.9˚C for ERA5 and between 22.7˚C and 33.8˚C for the in-situ. Mean daily air temperature is about 24.5˚C and 28.7˚C for ERA5 and in-situ measurements. Daily maximum temperature varies between 21.5˚C and 27.8˚C with a mean of 24.5˚C for ERA5, and 22.0˚C and 41.5˚C with a mean of 34.2˚C for in-situ measurements, respectively. When considering the daily minimum temperature, ERA5 is slightly warmer than the in-situ measured data at Lamto. ERA5 exhibits maximum temperature ranging from 21.2˚C to 27.5˚C with a mean of 24.3˚C, while the in-situ values range from 16 to 34.9˚C. It can be noticed that the extreme events characterized by a sharp increase or decrease in the temperature magnitude are poorly reproduced in the ERA5 data. This indicates a poor performance of using ERA5 to investigate extreme events over the Lamto station.</p>
    <fig id="fig2" position="float">
     <label>Figure 2</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 2. Timeseries comparison of daily air temperature at 2 m (a), daily minimum (b), and maximum (c) temperature, and relative humidity at the synoptic hours 06:00 UTC (d), 12:00 UTC (e), and 18:00 UTC (f) for the ERA5 and in-situ data between 14<sup>th</sup> January 2017 and 16<sup>th</sup> February 2023.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId32.jpeg?20251105021501" />
    </fig>
    <p>Analyzing the relative humidity comparison between ERA5 and in-situ recorded at synoptic hours, it can be observed that the main features (diurnal cycle, seasonality, etc.) match and the magnitude between the two datasets is in the same range. At 06:00 UTC, it varies from 51% to 100% with a mean of 95% for ERA5 and from 43.6% to 100% with a mean of 95% for the in-situ data. At 12:00 UTC, relative humidity fluctuates from 19.2% to 97% with a mean of 65% for ERA5, and for the in-situ, values range from 15.3% to 100% with a mean value of 66.7%. The mean relative humidity from the ERA5 reanalysis at 18:00 UTC is about 73.6% (range of 13.5% to 99.9%), and for the in-situ, the mean humidity is about 69.7% (range of 16.9% to 99.1%).</p>
    <p>
     <xref ref-type="fig" rid="fig3">
      Figure 3
     </xref> shows the Spearman correlation between the in-situ and ERA5 variables. Quite good and strong correlations (r varying from 0.48 to 0.73) are found between the temperature variables, and quite moderate correlations (r varying from 0.22 to 0.65) are found between the relative humidity variables, significant with p-values less than 0.01. These correlations between ERA5 and in-situ measured variables were like those reported by Bodjrènou <xref ref-type="bibr" rid="scirp.146987-55">
      [55]
     </xref> when assessing ERA5 hydrological variables with in-situ measurements over Benin. There is also moderate to strong anti-correlation between temperature and relative humidity, indicating that the relative humidity at Lamto station tends to decrease when temperature increases, as warmer air has a greater capacity to hold water vapour than cooler air <xref ref-type="bibr" rid="scirp.146987-56">
      [56]
     </xref>.</p>
    <fig id="fig3" position="float">
     <label>Figure 3</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 3. Heat map of the Spearman correlation between the in-situ and ERA5 of daily mean air temperature at 2 m, daily minimum and maximum temperature, relative humidity at the synoptic hours 06:00 UTC, 12:00 UTC, and 18:00 UTC between 14<sup>th</sup> January 2017 and 16<sup>th</sup> February 2023.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId33.jpeg?20251105021501" />
    </fig>
    <p>Overall, the ERA5 data capture the diurnal and seasonal cycles of climate and meteorological features of Lamto. As an evaluation of ERA5 data over the Lamto station using in-situ observed data did not exist in the literature, it appeared important for us to perform this quick evaluation on the ERA5 data, as it offers the advantage of a wider range of meteorological variables needed for the use of Artificial Intelligence (AI) tools in this work.</p>
   </sec>
   <sec id="s3_2">
    <title>3.2. Exploratory Analysis</title>
    <p>
     <xref ref-type="fig" rid="fig4">
      Figure 4
     </xref> shows the time series evolution of daily PM<sub>10</sub> concentrations at the Lamto station, marked by a strong seasonal cycle, with a peak occurring during the dry season (November to March). Minimum PM<sub>10</sub> concentrations are recorded during the rainy season (April to October). In contrast to a bimodal rainfall pattern observed at Lamto, the PM<sub>10</sub> concentration pattern is characterized by a single peak occurring during the dry season. Moreover, the highest PM<sub>10</sub> concentration peaks were recorded in 2018, with values reaching 888.9 μg/m<sup>3</sup> on 1<sup>st</sup> January. The year 2021 recorded relatively low PM<sub>10</sub> concentrations during the dry season compared to the other years. The dry season in Lamto is often impacted by pollutants from both local and long-range sources. During the dry season, Lamto station and surrounding areas are subject to biomass burning fires <xref ref-type="bibr" rid="scirp.146987-57">
      [57]
     </xref>, which are set by different groups of people for different reasons (research purposes, maintaining savanna landscapes, grazing and agriculture, hunting, ...). Moreover, N’Datchoh <xref ref-type="bibr" rid="scirp.146987-58">
      [58]
     </xref> showed that biomass burning is prevalent over the West African region from November to December, while analyzing satellite fire products from SPOT VEGETATION. In addition to these local and long-range sources from biomass burning activities, this region of West Africa is also reported to be impacted by dust aerosols transported from the Sahel and Saharan region to the Guinean Gulf by the Harmattan winds. During the main rainy season, minimum PM<sub>10</sub> concentrations are recorded with daily concentration values well below 50 μg/m<sup>3</sup>. Furthermore, these PM<sub>10</sub> daily concentration values maintain their lowest values during the little dry season. This little dry season in the region along the Guinean coast is often due to the WAM jump, which allows the WAM rain belt to be located over the Sahel region <xref ref-type="bibr" rid="scirp.146987-59">
      [59]
     </xref>.</p>
    <fig id="fig4" position="float">
     <label>Figure 4</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 4. Daily PM<sub>10 </sub>concentration time series, with different colours corresponding to a specific year.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId34.jpeg?20251105021502" />
    </fig>
    <p>
     <xref ref-type="table" rid="table3">
      Table 3
     </xref> summarizes the descriptive statistics for the raw PM<sub>10</sub> database at Lamto. A total of 2225 days were analysed. An average of daily PM<sub>10</sub> concentrations of about 42.79 μg/m<sup>3</sup> is associated with a very high standard deviation of about 59.5 μg/m<sup>3</sup>, as well as a median of 22.15 μg/m<sup>3</sup>, indicating a high variability and lack of balance in PM<sub>10</sub> concentrations in Lamto. This type of distribution, asymmetrical and spread out towards the high values, reflects the presence of occasional high pollution events.</p>
    <table-wrap id="table2">
     <label>
      <xref ref-type="table" rid="table2">
       Table 2
      </xref></label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Table 3. Daily PM<sub>10</sub> concentration at Lamto dataset basic statistics overview between 2017 and 2023.</title>
     </caption>
     <table class="MsoTableGrid custom-table" border="0" cellspacing="0" cellpadding="0"> 
      <tr> 
       <td class="custom-bottom-td acenter" width="50.00%"><p style="text-align:center">Parameter</p></td> 
       <td class="custom-bottom-td acenter" width="50.00%"><p style="text-align:center">Values (μg/m³)</p></td> 
      </tr> 
      <tr> 
       <td class="custom-top-td acenter" width="50.00%"><p style="text-align:center">Mean</p></td> 
       <td class="custom-top-td acenter" width="50.00%"><p style="text-align:center">42.79</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.00%"><p style="text-align:center">Standard deviation</p></td> 
       <td class="acenter" width="50.00%"><p style="text-align:center">59.49</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.00%"><p style="text-align:center">Minimum</p></td> 
       <td class="acenter" width="50.00%"><p style="text-align:center">7.31</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.00%"><p style="text-align:center">First quartile</p></td> 
       <td class="acenter" width="50.00%"><p style="text-align:center">16.35</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.00%"><p style="text-align:center">Median</p></td> 
       <td class="acenter" width="50.00%"><p style="text-align:center">22.15</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.00%"><p style="text-align:center">Third quartile</p></td> 
       <td class="acenter" width="50.00%"><p style="text-align:center">43.55</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="50.00%"><p style="text-align:center">Maximum</p></td> 
       <td class="acenter" width="50.00%"><p style="text-align:center">888.90</p></td> 
      </tr> 
     </table>
    </table-wrap>
   </sec>
   <sec id="s3_3">
    <title>3.3. Decomposition of the PM<sub>10</sub> Time Series</title>
    <p>
     <xref ref-type="fig" rid="fig4">
      Figure 4
     </xref> presents the original PM<sub>10</sub> concentration time series (<xref ref-type="fig" rid="fig5(a)">
      Figure 5(a)
     </xref>) and its decomposition into trend (<xref ref-type="fig" rid="fig5(b)">
      Figure 5(b)
     </xref>), seasonality (<xref ref-type="fig" rid="fig5(c)">
      Figure 5(c)
     </xref>), noise (<xref ref-type="fig" rid="fig5(d)">
      Figure 5(d)
     </xref>), and their transformation into a logarithmic function (<xref ref-type="fig" rid="figFigures 5(e)-(h)">
      Figures 5(e)-(h)
     </xref>). The logarithmic function was applied to the daily PM<sub>10</sub> concentration for the purpose of smoothing and attenuating the existing high variability observed in the data, making variation easier to analyse, as suggested by Hyndman and Athanasopoulos <xref ref-type="bibr" rid="scirp.146987-60">
      [60]
     </xref>. The overall trend (<xref ref-type="fig" rid="fig5(b)">
      Figure 5(b)
     </xref> and <xref ref-type="fig" rid="fig5(f)">
      Figure 5(f)
     </xref>) exhibits phases of high and low daily PM<sub>10</sub> concentrations, which are the result of complex interactions between environmental, climatic, and meteorological factors as well as human activities. A comparison between the original (<xref ref-type="fig" rid="fig5(b)">
      Figure 5(b)
     </xref>) and logarithmic function (<xref ref-type="fig" rid="fig5(f)">
      Figure 5(f)
     </xref>) shows a smoothing, allowing detection of changes that are crucial in the use of linear models. The seasonal decomposition (<xref ref-type="fig" rid="fig5(c)">
      Figure 5(c)
     </xref> and <xref ref-type="fig" rid="fig5(g)">
      Figure 5(g)
     </xref>) shows the seasonal cycle in the daily PM<sub>10</sub> concentrations, which are dominated by higher values of daily PM<sub>10</sub> concentration during the dry season compared to the wet season. Here, the use of the logarithmic transformation allows smoothing of the seasonal cycle while capturing the annual and seasonal cycles. Residual or noise components (<xref ref-type="fig" rid="fig5(d)">
      Figure 5(d)
     </xref> and <xref ref-type="fig" rid="fig5(h)">
      Figure 5(h)
     </xref>) characterize all daily PM<sub>10</sub> concentration data, which cannot be explained either by trend or seasonality. Since SARIMA needs stability to provide accurate results in terms of its output, the logarithmic transformation allows smoothing of the data and facilitates its machine learning process, which can be affected by very high values such as extreme events <xref ref-type="bibr" rid="scirp.146987-61">
      [61]
     </xref>. The presence of structured trends and well-defined seasonality favored the use of classical models such as SARIMAX, which can take explicit account of such trend and seasonality. However, the unpredictable nature of certain variations and the possible non-linear interactions between daily PM<sub>10</sub> concentration and meteorological variables favoured the consideration of more flexible machine learning models, such as XGBoost, Random Forest, or LightGBM. These latter models are known for their robustness in dealing with noisy and highly variable data and their ability to capture complex relationships <xref ref-type="bibr" rid="scirp.146987-62">
      [62]
     </xref> between variables.</p>
    <fig id="fig5" position="float">
     <label>Figure 5</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 5. Time series of PM<sub>10</sub> concentrations and logarithmic transformations (log): Original ((a) and (e)), Trend ((b) and (f)), Seasonality ((c) and (g)), and Noise ((d) and (h)).</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId35.jpeg?20251105021502" />
    </fig>
    <p>A Shapiro-Wilk test recommended for moderate to large samples was conducted in order to check whether the daily PM<sub>10</sub> follows a normal distribution. The Shapiro-Wilk test results reveal that all the variables considered here deviated significantly from normality, with a very low statistic for PM<sub>10</sub> (W = 0.51) and a p-value close to zero (≈1.12 × 10<sup>−</sup><sup>59</sup>) (W = 0.51) and a p-value close to zero (≈1.12 × 10, implying that classic parametric tests were less appropriate for this work. Therefore, a non-parametric Kruskal-Wallis test was conducted to check monthly and yearly variability significance in the daily PM<sub>10</sub> dataset. This allows confirmation of the existence of strong monthly variability and seasonality of all variables considered. An ADF (Augmented Dickey-Fuller) stationarity test, which is a must for any time series study <xref ref-type="bibr" rid="scirp.146987-63">
      [63]
     </xref>, was conducted. These test results indicate that the time series are stationary, meaning that their statistical properties (mean, variance) remain constant over time.</p>
    <p>
     <xref ref-type="fig" rid="fig6">
      Figure 6
     </xref> presents the seasonal pattern for PM10 concentration climatology between 2017 and 2023.</p>
    <fig id="fig6" position="float">
     <label>Figure 6</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 6. Boxplots showing the seasonal pattern of PM<sub>10</sub> concentrations from 2017 to 2023.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId36.jpeg?20251105021503" />
    </fig>
   </sec>
   <sec id="s3_4">
    <title>3.4. Explanatory Variables</title>
    <p>The final selection of explanatory variables and their optimal lags is presented in <xref ref-type="table" rid="table4">
      Table 4
     </xref>. Time lags of 1 to 3 days [PM<sub>10</sub>(t-1), PM<sub>10</sub>(t-2), PM<sub>10</sub>(t-3)] were included as additional explanatory variables. This decision was motivated by two preliminary analyses. (i) An examination of the autocorrelation (ACF) and partial autocorrelation (PACF) functions revealed significant dependence up to a lag of three days. (ii) A comparative performance evaluation showed that adding lags beyond 3 days lag (d-3) did not significantly improve RMSE and R<sup>2</sup> metrics, while increasing the risk of overfitting. This choice is also consistent with several previous work <xref ref-type="bibr" rid="scirp.146987-64">
      [64]
     </xref> that have demonstrated the significant contribution of delayed PM₁₀ values in predicting future concentrations. To avoid any leakage of information from the future to the past, which would distort the predictions, a breakdown of the time series into two sets was performed: the training data (Train) covers the period from 14 January 2017 to 28 November 2021, i.e., 1780 days, and the test data runs from 29 November 2021 to 16 February 2023, representing 445 days. This breakdown respects the natural temporal logic of the series, a fundamental criterion in the context of forecasting. This breakdown can be seen in<xref ref-type="fig" rid="fig7">
      Figure 7
     </xref>. <xref ref-type="fig" rid="fig7(a)">
      Figure 7(a)
     </xref> shows the separation of the daily PM10 concentration series into train (blue color) and test before filling the missing values. <xref ref-type="fig" rid="fig7(b)">
      Figure 7(b)
     </xref> shows the daily PM<sub>10</sub> concentration with the missing values filled using the median of similar days in previous and following years to consider the strong seasonality observed in the dataset. For example, the missing values on 10 July 2019 are interpolated using the median for 10 July in 2017, 2018, 2020, etc. This method inspired by the work of Weed <xref ref-type="bibr" rid="scirp.146987-65">
      [65]
     </xref> makes it possible to retain seasonal effects without introducing time distortion. Although this method is not the most common in the literature, it is based on a simple and solid logic, which takes advantage of seasonal repeatability from one year to the next. It is particularly well suited to environmental data, where seasonal effects are often very marked.</p>
    <table-wrap id="table3">
     <label>
      <xref ref-type="table" rid="table3">
       Table 3
      </xref></label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Table 4. Explanatory variables and optimal time lags used in this work.</title>
     </caption>
     <table class="MsoTableGrid custom-table" border="0" cellspacing="0" cellpadding="0"> 
      <tr> 
       <td class="custom-bottom-td acenter" width="22.79%"><p style="text-align:center">Variables</p></td> 
       <td class="custom-bottom-td acenter" width="63.30%"><p style="text-align:center">Full name of the variables</p></td> 
       <td class="custom-bottom-td acenter" width="13.91%"><p style="text-align:center">Time lag</p></td> 
      </tr> 
      <tr> 
       <td class="custom-top-td acenter" width="22.79%"><p style="text-align:center">var18_swvl1</p></td> 
       <td class="custom-top-td acenter" width="63.30%"><p style="text-align:center">Soil water content-surface layer</p></td> 
       <td class="custom-top-td acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var5_mx2t</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Maximum temperature at 2 m</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var6_tcwv</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Total precipitable water in the air column</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">Month</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Month of the year</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var14_slhf</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Latent surface heat flux</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var11_msl</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Atmospheric pressure at mean sea level</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var8_blh</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Height of the atmospheric boundary layer</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var3_tcc</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Total cloud cover</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">6 days</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var4_d2m_C</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Dew point temperature at 2 m</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">var7_avg_snswrf</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">Net short-wave solar flux at the surface</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">2 days</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">PM10_lag1</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">PM<sub>10</sub> surface concentration of the previous day</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">1 day</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">PM10_lag2</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">PM<sub>10</sub> surface concentration of the two previous days</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">2 days</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="22.79%"><p style="text-align:center">PM10_lag3</p></td> 
       <td class="acenter" width="63.30%"><p style="text-align:center">PM<sub>10</sub> surface concentration of the 3 previous days</p></td> 
       <td class="acenter" width="13.91%"><p style="text-align:center">3 days</p></td> 
      </tr> 
     </table>
    </table-wrap>
    <fig id="fig7" position="float">
     <label>Figure 7</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 7. Daily PM<sub>10</sub> surface concentration breakdown into train from 14<sup>th</sup> January 2017 to 28<sup>th</sup> November 2021 (1780 days) and test runs from 29<sup>th</sup> November 2021 to 16<sup>th</sup> February 2023 (445 days) for (a) original data and (b) missing data fill-up.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId37.jpeg?20251105021503" />
    </fig>
    <p>To handle missing values in daily PM₁₀ concentrations, we used the median of observations from the same calendar day in other years of the study. This method was selected for its proven ability to preserve the temporal characteristics of time series. However this way of handling the missing data may potentially bias the model training by reducing the natural variance of the data and smoothing out actual pollution peaks. This may lead the model to underestimate the amplitude of surface PM<sub>10</sub> concentration peaks during high pollution events. As a result, test errors could be underestimated during validation, as the model would be evaluated on smoothed data that does not fully reflect the diversity and intensity of the observed conditions, which could limit its ability to generalize to new data.</p>
   </sec>
   <sec id="s3_5">
    <title>3.5. Separation of Time Series and Handling of Missing Values</title>
    <p>To assess the reliability and ability of the Machine Learning models to generalize well the predictions of PM<sub>10</sub> concentrations, a cross-validation was done. The model was trained on past data to make predictions about a future period, without ever using information from the future. Three models were used, namely Random Forest, XGBoost, and LightGBM. For each model, performance was measured using the root mean square error (RMSE). Mean errors obtained are summarized in <xref ref-type="table" rid="table3">
      Table 3
     </xref>, highlighting that the Random Forest model performs better, with an average RMSE of 15.94. It is closely followed by LightGBM (16.44), then XGBoost (17.03). These scores indicate that Random Forest seems to better capture the dynamics of the daily PM<sub>10</sub> concentration, while remaining stable across the different periods tested. However, the SARIMAX model was not included in this cross-validation. The SARIMAX model relies heavily on the temporal dependence between observations, and therefore was evaluated separately, using a simple chronological breakdown between training and testing.</p>
   </sec>
   <sec id="s3_6">
    <title>3.6. Final Evaluation and Model Performance</title>
    <p>
     <xref ref-type="fig" rid="fig8">
      Figure 8
     </xref> shows the original (blue) and predicted time series modelled (orange) by daily PM<sub>10</sub> surface concentrations from January 2022 to March 2023 for SARIMAX (<xref ref-type="fig" rid="fig8(a)">
      Figure 8(a)
     </xref>), Random Forest (<xref ref-type="fig" rid="fig8(b)">
      Figure 8(b)
     </xref>), XGBoost (<xref ref-type="fig" rid="fig8(c)">
      Figure 8(c)
     </xref>), and LightGBM (<xref ref-type="fig" rid="fig8(d)">
      Figure 8(d)
     </xref>). The hyperparameters used for each model are presented in the supplementary material (<xref ref-type="table" rid="tableS1">
      Table S1
     </xref>). It should be noted, that no performance optimisation tests were carried out on in this present work. We used default configurations for each of the models. Overall, all four models were able to capture the general trend of the PM<sub>10</sub> surface concentration in Lamto. However, a close analysis of <xref ref-type="fig" rid="fig8">
      Figure 8
     </xref> reveals some slight differences between the models themselves and between the models and the in-situ observations. For example, the PM<sub>10</sub> concentrations range from 10.19 (minimum) to 210.01 (maximum) µg/m<sup>3</sup> for the SARIMAX model, 10.48 (minimum) to 171.88 (maximum) µg/m<sup>3</sup> for the Random Forest model, 12.47 (minimum) to 190.37 (maximum) µg/m<sup>3</sup> for the XGBoost model, and 11.68 (minimum) to 171.20 (maximum) µg/m<sup>3</sup> for the LightGBM model, while the observations are within 8.00 (minimum) and 266.57 (maximum) µg/m<sup>3</sup>. All the models tend to overestimate the PM<sub>10</sub> minimum concentration, while they underestimate the maximum compared to the observations. Moreover, all models tend to slightly overestimate PM<sub>10</sub> concentrations compared to observations during the wet season. Furthermore, in terms of capturing the high variability in PM<sub>10</sub> concentration peaks associated with pollution events, some slight lags seem to be produced in all the models except the Random Forest, which seems</p>
    <fig id="fig8" position="float">
     <label>Figure 8</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 8. Original (blue) and predicted (orange) time series simulated by the (a) SARIMAX, (b) Random Forest, (c) XGBoost, and (d) LightGBM models of daily PM<sub>10</sub> surface concentrations from January 2022 to March 2023.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId38.jpeg?20251105021504" />
    </fig>
    <table-wrap id="table4">
     <label>
      <xref ref-type="table" rid="table4">
       Table 4
      </xref></label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Table 5. Statistical indicators RMSE, MAE, and R<sup>2</sup> provided at annual and seasonal time scales for each of the four models used in this study.</title>
     </caption>
     <table class="MsoTableGrid custom-table" border="0" cellspacing="0" cellpadding="0"> 
      <tr> 
       <td class="custom-bottom-td acenter" width="34.13%"><p style="text-align:center"></p></td> 
       <td class="custom-bottom-td acenter" width="16.46%"><p style="text-align:center">Random forest</p></td> 
       <td class="custom-bottom-td acenter" width="16.46%"><p style="text-align:center">XGBoost</p></td> 
       <td class="custom-bottom-td acenter" width="16.46%"><p style="text-align:center">LightGBM</p></td> 
       <td class="custom-bottom-td acenter" width="16.47%"><p style="text-align:center">SARIMAX</p></td> 
      </tr> 
      <tr> 
       <td class="custom-top-td acenter" width="34.13%"><p style="text-align:center">RMSE (μg/m<sup>3</sup>)</p></td> 
       <td class="custom-top-td acenter" width="16.46%"><p style="text-align:center">23.12</p></td> 
       <td class="custom-top-td acenter" width="16.46%"><p style="text-align:center">24.31</p></td> 
       <td class="custom-top-td acenter" width="16.46%"><p style="text-align:center">23.70</p></td> 
       <td class="custom-top-td acenter" width="16.47%"><p style="text-align:center">28.52</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">MAE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">12.35</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">13.23</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">12.78</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">16.52</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">R<sup>2</sup></p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.78</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.75</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.76</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">0.64</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Main dry season RMSE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">33.98</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">35.41</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">35.66</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">39.93</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Main dry season MAE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">22.38</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">23.28</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">24.08</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">29.84</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Main dry season R<sup>2</sup></p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.61</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.58</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.57</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">0.46</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Main wet season RMSE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">7.79</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">8.11</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">7.98</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">16.31</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Main wet season MAE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">5.20</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">5.46</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">5.36</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">12.99</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Main wet season R<sup>2</sup></p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.73</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.71</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.72</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">−0.18</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Little dry season RMSE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">4.82</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">4.81</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">5.13</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">17.97</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Little dry season MAE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">4.02</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">3.96</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">4.38</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">15.67</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Little dry season R<sup>2</sup></p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.13</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.13</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.01</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">−2.81</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Little wet season RMSE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">3.58</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">3.68</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">3.72</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">8.47</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Little wet season MAE (μg/m<sup>3</sup>)</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">2.65</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">2.87</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">2.90</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">6.94</p></td> 
      </tr> 
      <tr> 
       <td class="acenter" width="34.13%"><p style="text-align:center">Little wet season R<sup>2</sup></p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.32</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.28</p></td> 
       <td class="acenter" width="16.46%"><p style="text-align:center">0.26</p></td> 
       <td class="acenter" width="16.47%"><p style="text-align:center">−11.11</p></td> 
      </tr> 
     </table>
    </table-wrap>
    <p>to follow more closely. Therefore, it appears necessary to evaluate the performances of the different models that are measured using indicators such as RMSE, MAE, and R<sup>2</sup>. These indicators are summarized in <xref ref-type="table" rid="table5">
      Table 5
     </xref> for the entire predicted timeseries but also per season. From <xref ref-type="table" rid="table5">
      Table 5
     </xref>, it can be seen that the SARIMAX model is the least performant model with a limited capacity to capture changes in the daily PM<sub>10</sub> concentrations at Lamto, as it scored lower performance, with a RMSE of 28.52 μg/m<sup>3</sup>, a MAE of 16.52 μg/m<sup>3</sup>, and a R<sup>2</sup> of 0.64. These relatively poor scores underline that the present models (Random Forest, XGBoost, LightGBM, and SARIMAX) have poor capacity in reproducing daily PM<sub>10</sub> surface concentration, which may be explained by its high variance and the complex interaction between meteorology, local, and long-range factors that influence the PM<sub>10</sub> loaded in the Lamto atmosphere. PM<sub>10</sub> concentrations in Lamto are influenced by complex non-linear phenomena as well as irregular exogenous factors, which are difficult to model within a purely statistical framework.</p>
    <p>Conversely, the Machine Learning models show a potential possibility to be adapted and to integrate complex atmospheric processes involving local and long-range factors under the condition of providing good and robust observations, which may be used to train and test them. Therefore, the Random Forest model scored a better overall performance with an RMSE of 23.12 μg/m<sup>3</sup>, an MAE of 12.35 μg/m<sup>3</sup>, and an R<sup>2</sup> of 0.78. Furthermore, an RMSE of 23.12 indicates an average prediction error of 23.12 μg/m<sup>3</sup> compared with the actual values, while an MAE of 12.35 underlines that the average absolute difference between the predicted and observed values is 12.35 μg/m<sup>3</sup>. The coefficient of determination R<sup>2</sup> = 0.78 indicates that 78% of the variability in the daily PM<sub>10</sub> surface concentrations may be explained by the model, which is satisfactory but also suggests margins of error. Therefore, in general, the pattern of the daily PM<sub>10</sub> concentration is better reproduced by the random forest, despite some bias. For example, the predicted PM<sub>10</sub> values during the dry season (November to March) are less important than those observed. These biases are associated with specific events of PM<sub>10</sub> pollution, which are more frequent during the dry season. The relatively low daily PM<sub>10</sub> surface concentration during the wet season is quite well reproduced in both pattern and magnitude, highlighting the ability of machine learning to better assimilate periods characterized by weak changes.</p>
    <p>Variables permutation importance for the Random Forest, LightGBM, and XGBoost are shown in <xref ref-type="fig" rid="fig9">
      Figure 9
     </xref>. This post-modeling analysis confirms the relevance of preliminary selection of variables based on mutual information and cross-correlation. The results of that PM10_lag1 predominance highlights a temporal self-dependence as the predominant mechanism in predicting PM<sub>10 </sub>surface concentration in Lamto. Also, the PM10_lag2 and PM10_lag3 delays confirm this multi-day persistence, may be related to the dry season where rainfall is less frequent, less washout of atmosphere occurring and more pollutant particularly PM<sub>10</sub> holds into atmosphere. When considering, meteorological variables, boundary layer height (var8_blh_lag1), humidity (var4_d2m_C_lag1), temperature (var5_mx2t_lag1), and latent heat flux (var14_slhf_lag1) emerge as consistent secondary modulators, influencing vertical dispersion, hygroscopic particle growth, convection, and turbulence, respectively. Finally, the Month_lag1 variable robustly captures the seasonality documented in Lamto. This multi-model analysis validates both the robustness of the predictors and the complementarity of our variable selection approaches. Finally, because of the SARIMAX model’s structure, variable permutation is not possible; therefore, permutation importance could not be computed and was excluded from this analysis.</p>
    <fig id="fig9" position="float">
     <label>Figure 9</label>
     <caption>
      <title>
       <xref ref-type="bibr" rid="scirp.146987-"></xref>Figure 9. Variables permutation importance for (a) Random Forest; (b) XGBoost; and (c) LghtGBM.</title>
     </caption>
     <graphic mimetype="image" position="float" xlink:type="simple" xlink:href="https://html.scirp.org/file/2430341-rId39.jpeg?20251105021504" />
    </fig>
   </sec>
   <sec id="s3_7">
    <title>3.7. Discussion</title>
    <p>This work focused on the use of Machine Learning (ML) tools for predicting PM<sub>10</sub> concentrations. To achieve this goal, the methodology applied consisted of four ML models, namely SARIMAX, Random Forest, XGBoost, and LightGBM models, to train them over 80% of the total filtered PM<sub>10</sub> data length. The remaining 20% of the observed PM<sub>10</sub> data was used for testing the model outputs. The Random Forest was identified as the best-performing model among these four models, with estimated biases of 23.12 µg/m<sup>3</sup>. These observed biases between original and predicted daily PM<sub>10</sub> surface concentration at Lamto may be explained, on the one hand, by the complex mixture of sources influencing its chemical composition <xref ref-type="bibr" rid="scirp.146987-22">
      [22]
     </xref> <xref ref-type="bibr" rid="scirp.146987-26">
      [26]
     </xref> <xref ref-type="bibr" rid="scirp.146987-40">
      [40]
     </xref>. Lamto chemical composition is the result of a combination of local (biomass burning, domestic fires, biogenic emission, ...) and remote (long-range transport of dust from the Northern Hemisphere of Africa during the dry season, biomass burning, sea salt, ...). The dry season months are characterized by high variability in pollution events, as all local and long-range transport of Sahel and Saharan dust transportation toward the Guinean Gulf <xref ref-type="bibr" rid="scirp.146987-66">
      [66]
     </xref> are also prevalent. On the other hand, biases observed between ERA5 and the in-situ measurement may have contributed to all models underestimating pollutant events maxima. A combination of in-situ measurement (when these are available) and ERA5 data for the machine learning models may contribute to reducing these observed maxima underestimations observed in all models used. Thus, this low performance of the model during the dry season may be related to the high variability in daily PM<sub>10</sub>, which contributes directly to the increase in model error and cold biases observed with the ERA5 meteorological temperature variables. During the wet season, the washout of the atmosphere by rain contributes to fewer high air pollution events, thus PM<sub>10</sub> loads into the atmosphere. This led to the higher scores observed by all models, especially the Random Forest. This finding highlights the current difficulties and limitations of applying logical tools such as mathematics through modelling to complex environmental processes involving meteorology and climate, which are highly impacted by human socio-economic activities such as air pollution. Arowosegbe <xref ref-type="bibr" rid="scirp.146987-67">
      [67]
     </xref> used Random Forest models to impute missing daily PM<sub>10</sub> concentrations in South Africa between 2010 and 2017 using spatio-temporal predictors including meteorological variables, land cover, elevation, and proximity to roads. They found an average R<sup>2</sup> of 0.78 at the national level, 0.70 at the provincial level, and 0.55 at the level of each site, thus demonstrating the effectiveness of the Random Forest model in an African context despite the scarcity of data. The temporal component of the national models explained up to 78% of the variability in concentrations. Moreover, Adnane <xref ref-type="bibr" rid="scirp.146987-68">
      [68]
     </xref> in Morocco used Nonlinear Autoregressive Neural Networks with Exogenous Inputs (NARX) models to predict hourly PM<sub>10</sub> concentrations in Agadir, at 1 h and 24 h horizons. The best results were obtained with the 24h horizon model, combining meteorological variables and secondary pollutants (CO, SO<sub>2</sub>, O<sub>3</sub>) as inputs. The model achieved a correlation coefficient of 93.75%, i.e., an approximate R<sup>2</sup> of 0.88, illustrating the added value of pollution data combined with meteorological variables in improving predictive performance.</p>
    <p>As hybrid models have been reported to have better performance for environmental monitoring policy and decision-making <xref ref-type="bibr" rid="scirp.146987-35">
      [35]
     </xref> <xref ref-type="bibr" rid="scirp.146987-36">
      [36]
     </xref>, such methods need to be evaluated in the limited data context of sub-Saharan Africa. As AI is emerging as a necessary transversal tool in many research areas, the African continent must integrate such a tool in environmental process monitoring and management. Applying AI to their AirQo low-cost sensors in Africa, Bainomugisha <xref ref-type="bibr" rid="scirp.146987-69">
      [69]
     </xref> highlighted a set of digital solutions for the environmental air pollution challenges from custom-designed low-cost air quality monitors, deployment methodology, AI-powered digital tools, and a framework for citizens’ and leaders’ engagement. Finally, leveraging AI and data science to mitigate the respiratory health impacts in the context of climate change in Africa, Sowunmi <xref ref-type="bibr" rid="scirp.146987-70">
      [70]
     </xref> emphasized pilot AI-driven health monitoring systems in major cities with clear indicators, such as improved weather forecasts, reductions in respiratory symptoms or hospitalizations, and improved healthcare access.</p>
   </sec>
  </sec><sec id="s4">
   <title>4. Conclusions</title>
   <p>Daily PM<sub>10</sub> surface concentrations in Lamto over seven years (2017-2023) were investigated using a machine learning tool. To achieve this, firstly, the ERA5 daily data were assessed with in-situ measurements recorded at the Lamto station. This assessment shows that, despite some biases, ERA5 can reproduce a fairly diurnal cycle of temperature and relative humidity for Lamto. Good and strong correlations (r varying from 0.48 to 0.73) are found between the ERA5 and in-situ measurements of temperature variables. Also, moderate correlations (0.22 to 0.65) exist between the relative humidity variables of these two datasets.</p>
   <p>Using 25 meteorological variables from daily ERA5 and PM<sub>10</sub> surface concentration, we applied machine learning to 80% (14<sup>th</sup> January 2017 to 28<sup>th</sup> November 2021, i.e., 1780 days) of the daily PM<sub>10</sub> surface concentration to train four machine learning models (SARIMAX, Random Forest model, XGBoost, and LightGBM), while 20% (from 1<sup>st</sup> January 2022 to March 2023, i.e., 445 days) were used to validate their predictions. All the models reasonably reproduced trends and patterns of PM<sub>10</sub> daily concentration compared to the in-situ observations, despite some biases. These biases consisted of a slight overestimation of the daily PM<sub>10</sub> concentration during the wet season, while underestimating high pollution days during the dry season. The performances of these four machine learning models were evaluated using indicators such as RMSE, MAE, and R<sup>2</sup>. The Random Forest model achieved an R<sup>2</sup> of 0.78 and an RMSE of 23 μg/m<sup>3</sup>, surpassing the performance of the SARIMAX model (R<sup>2</sup> of 0.64 and an RMSE of 28.54 μg/m<sup>3</sup>), XGBOOST (R<sup>2</sup> of 0.74 and an RMSE of 24.54 μg/m<sup>3</sup>), and LightGBM (R<sup>2</sup> of 0.76 and an RMSE of 23.70 μg/m<sup>3</sup>). This model’s performance helped identify the Random Forest as the best performing model in reproducing the daily PM<sub>10</sub> surface concentration at Lamto. This performance was better during the wet season, when daily PM<sub>10</sub> presents less variability with low pollution levels. Despite the high variability associated with pollution events depending on local and remote factors, the pattern was captured despite a lower high pollution magnitude. Moreover, the low performance of the machine learning models during the dry season may be related to this high variability in daily PM<sub>10</sub> and biases observed with ERA5 meteorological data, though we did not investigate the error sources and their impacts on the work. Future work will focus on the contribution of bias correction into ERA5 as well as the combination of models to improve the machine learning model performance in capturing environmental processes over Lamto and other places of the country and the continent.</p>
  </sec><sec id="s5">
   <title>Acknowledgements</title>
   <p>The authors would like to acknowledge the INDAAF (International Network to study Deposition and Atmospheric chemistry in Africa) project. INDAAF is supported by the INSU (Institut National des Sciences de l'Univers)/CNRS (Centre National de la Recherche Scientifique), IRD (Institut de Recherche pour le Développement) and the research infrastructure ACTRIS-FR registered on the Roadmap of the French Ministry of Research. We also express our gratitude to all INDAAF local technicians for their maintenance and sampling work. We would also like to thank the JEAI PATI (Jeune Equipe Associée de l’IRD Physico-chimie Atmosphérique et Impacts) project under the sponsorship of the IRD for their generous financial support in the publication of this article.</p>
  </sec><sec id="s6">
   <title>Data Availability</title>
   <p>The INDAAF data can be retrieved from the website <xref ref-type="bibr" rid="scirp.146987-https://indaaf.obs-mip.fr/">
     https://indaaf.obs-mip.fr/
    </xref>. Interested persons may contact corinne.galy-lacaux@aero.obs-mip.fr or beatrice.marticorena@lisa.ipsl.fr for these data.</p>
  </sec><sec id="s7">
   <title>Author Contributions</title>
   <p>Conceptualization and methodology, N.E.T., M.G.O., and C.E.; Analysis experience, N.E.T., M.G.O., C.E., and A.B.; writing—original draft preparation, N.E.T., M.G.O., A.B., C.E., K.K., F.Y., M.D., M.L.D., G.N.S.K., and V.Y.; writing—review and editing, N.E.T., M.G.O., A.B., C.E., K.K., F.Y., M.D., M.L.D., G.N.S.K. All authors have read and agreed to the published version of the manuscript.</p>
  </sec><sec id="s8">
   <title>Supplement Material</title>
   <table-wrap id="table5">
    <label>
     <xref ref-type="table" rid="table5">
      Table 5
     </xref></label>
    <caption>
     <title>
      <xref ref-type="bibr" rid="scirp.146987-"></xref>Table S1. Hyperparameter information used for each of the model use in this study. Note that, nosystematic investigation for hyperparameters (using grid or cross-validation) was performed, as we focused in this study on basic comparison of models with their default configuration.</title>
    </caption>
    <table class="MsoTableGrid custom-table" border="0" cellspacing="0" cellpadding="0"> 
     <tr> 
      <td class="aleft" width="14.77%"><p style="text-align:left">Model</p></td> 
      <td class="aleft" width="30.90%"><p style="text-align:left">Hyperparameter</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">Final value or setting</p></td> 
      <td class="aleft" width="38.59%"><p style="text-align:left">Reference / comment</p></td> 
     </tr> 
     <tr> 
      <td rowspan="3" class="custom-top-td acenter" width="14.77%"><p style="text-align:center">Random Forest</p></td> 
      <td class="custom-top-td acenter" width="30.90%"><p style="text-align:center">n_estimators</p></td> 
      <td class="custom-top-td acenter" width="15.74%"><p style="text-align:center">100</p></td> 
      <td class="custom-top-td acenter" width="38.59%"><p style="text-align:center">Number of trees in the forest</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">max_depth</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">10</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Maximum depth of each tree</p></td> 
     </tr> 
     <tr> 
      <td class="custom-bottom-td acenter" width="30.90%"><p style="text-align:center">random_state</p></td> 
      <td class="custom-bottom-td acenter" width="15.74%"><p style="text-align:center">42</p></td> 
      <td class="custom-bottom-td acenter" width="38.59%"><p style="text-align:center">Reproducibility</p></td> 
     </tr> 
     <tr> 
      <td rowspan="4" class="custom-top-td acenter" width="14.77%"><p style="text-align:center">XGBoost</p></td> 
      <td class="custom-top-td acenter" width="30.90%"><p style="text-align:center">n_estimators</p></td> 
      <td class="custom-top-td acenter" width="15.74%"><p style="text-align:center">100</p></td> 
      <td class="custom-top-td acenter" width="38.59%"><p style="text-align:center">Number of boosting rounds</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">learning_rate</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">0.1</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Learning rate</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">max_depth</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">3</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Maximum depth of each tree</p></td> 
     </tr> 
     <tr> 
      <td class="custom-bottom-td acenter" width="30.90%"><p style="text-align:center">random_state</p></td> 
      <td class="custom-bottom-td acenter" width="15.74%"><p style="text-align:center">42</p></td> 
      <td class="custom-bottom-td acenter" width="38.59%"><p style="text-align:center">Random seed for reproducibility</p></td> 
     </tr> 
     <tr> 
      <td rowspan="5" class="custom-top-td acenter" width="14.77%"><p style="text-align:center">LightGBM</p></td> 
      <td class="custom-top-td acenter" width="30.90%"><p style="text-align:center">objective</p></td> 
      <td class="custom-top-td acenter" width="15.74%"><p style="text-align:center">regression</p></td> 
      <td class="custom-top-td acenter" width="38.59%"><p style="text-align:center">Regression task</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">metric</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">rmse</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Evaluation function</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">boosting_type</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">gbdt</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Type of boosting algorithm</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">num_boost_round</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">100</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Number of learning iterations</p></td> 
     </tr> 
     <tr> 
      <td class="custom-bottom-td acenter" width="30.90%"><p style="text-align:center">early_stopping_rounds</p></td> 
      <td class="custom-bottom-td acenter" width="15.74%"><p style="text-align:center">10</p></td> 
      <td class="custom-bottom-td acenter" width="38.59%"><p style="text-align:center">Early stopping if no improvement</p></td> 
     </tr> 
     <tr> 
      <td rowspan="4" class="custom-top-td acenter" width="14.77%"><p style="text-align:center">SARIMAX</p></td> 
      <td class="custom-top-td acenter" width="30.90%"><p style="text-align:center">order (p, d, q)</p></td> 
      <td class="custom-top-td acenter" width="15.74%"><p style="text-align:center">(1, 0, 2)</p></td> 
      <td class="custom-top-td acenter" width="38.59%"><p style="text-align:center">Autoregressive and moving average components</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">seasonal_order (P, D, Q, s)</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">(2, 0, 2, 12)</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">Seasonal components (s = 12 for monthly annual cycle)</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">enforce_stationarity</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">False</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">No forcing of stationarity</p></td> 
     </tr> 
     <tr> 
      <td class="acenter" width="30.90%"><p style="text-align:center">enforce_invertibility</p></td> 
      <td class="acenter" width="15.74%"><p style="text-align:center">False</p></td> 
      <td class="acenter" width="38.59%"><p style="text-align:center">No forcing of invertibility</p></td> 
     </tr> 
    </table>
   </table-wrap>
  </sec>
 </body><back>
  <ref-list>
   <title>References</title>
   <ref id="scirp.146987-ref1">
    <label>1</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     IPCC (2001) Climate Change 2001: The Scientific Basis. Contribution of Working Group I to the Third Assessment Report of the Intergovernmental Panel on Climate Change. Cambridge University Press, 881.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref2">
    <label>2</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     IPCC (2014) Climate Change 2014: Mitigation of Climate Change. Contribution of Working Group III to the Fifth Assessment Report of the Intergovernmental Panel on Climate Change. Cambridge University Press.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref3">
    <label>3</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Lohmann, U. and Feichter, J. (2001) Can the Direct and Semi-Direct Aerosol Effect Compete with the Indirect Effect on a Global Scale? Geophysical Research Letters, 28, 159-161. &gt;https://doi.org/10.1029/2000gl012051
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref4">
    <label>4</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Nabat, P., Somot, S., Mallet, M., Michou, M., Sevault, F., Driouech, F., et al. (2015) Dust Aerosol Radiative Effects during Summer 2012 Simulated with a Coupled Regional Aerosol-Atmosphere-Ocean Model over the Mediterranean. Atmospheric Che-mistry and Physics, 15, 3303-3326. &gt;https://doi.org/10.5194/acp-15-3303-2015
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref5">
    <label>5</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Seinfeld, J.H. and Pandis, S.N. (1998) From Air Pollution to Climate Change. Atmospheric Chemistry and Physics, 1326.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref6">
    <label>6</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Knippertz, P., Coe, H., Chiu, J.C., Evans, M.J., Fink, A.H., Kalthoff, N., et al. (2015) The DACCIWA Project: Dynamics-Aerosol-Chemistry-Cloud Interactions in West Africa. Bulletin of the American Meteorological Society, 96, 1451-1460. &gt;https://doi.org/10.1175/bams-d-14-00108.1
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref7">
    <label>7</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Fiore, A.M., Naik, V. and Leibensperger, E.M. (2015) Air Quality and Climate Connections. Journal of the Air &amp; Waste Management Association, 65, 645-685. &gt;https://doi.org/10.1080/10962247.2015.1040526
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref8">
    <label>8</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Nairobi, 2022 United Nations Environment Programme.&gt;https://www.ccacoalition.org/sites/default/files/resources/files/Summary%20for%20Decision%20Makers_Integrated%20Assessment%20of%20Air%20Pollution%20and%20Climate%20Change%20for%20Sustainable%20Development%20in%20Africa.pdf 
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref9">
    <label>9</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     De Longueville, F., Hountondji, Y., Henry, S. and Ozer, P. (2010) What Do We Know about Effects of Desert Dust on Air Quality and Human Health in West Africa Compared to Other Regions? Science of the Total Environment, 409, 1-8. &gt;https://doi.org/10.1016/j.scitotenv.2010.09.025
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref10">
    <label>10</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Mir Alvarez, C., Hourcade, R., Lefebvre, B. and Pilot, E. (2020) A Scoping Review on Air Quality Monitoring, Policy and Health in West African Cities. International Journal of Environmental Research and Public Health, 17, Article 9151. &gt;https://doi.org/10.3390/ijerph17239151
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref11">
    <label>11</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Bahino, J., Giordano, M., Beekmann, M., Yoboué, V., Ochou, A., Galy-Lacaux, C., et al. (2024) Temporal Variability and Regional Influences of PM
     <sub>2.5</sub> in the West African Cities of Abidjan (Côte d’Ivoire) and Accra (Ghana). Environmental Science: Atmospheres, 4, 468-487. &gt;https://doi.org/10.1039/d4ea00012a
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref12">
    <label>12</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Djossou, J., Léon, J., Akpo, A.B., Liousse, C., Yoboué, V., Bedou, M., et al. (2018) Mass Concentration, Optical Depth and Carbon Composition of Particulate Matter in the Major Southern West African Cities of Cotonou (Benin) and Abidjan (Côte d’Ivoire). Atmospheric Chemistry and Physics, 18, 6275-6291. &gt;https://doi.org/10.5194/acp-18-6275-2018
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref13">
    <label>13</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Anand, A., Touré, N.E., Bahino, J., Gnamien, S., Hughes, A.F., Arku, R.E., et al. (2024) Low-Cost Hourly Ambient Black Carbon Measurements at Multiple Cities in Africa. Environmental Science &amp; Technology, 58, 12575-12584. &gt;https://doi.org/10.1021/acs.est.4c02297
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref14">
    <label>14</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Gnamien, S., Liousse, C., Keita, S., Silué, S., Bahino, J., Gardrat, E., et al. (2023) Chemical Characterization of Urban Aerosols in Abidjan and Korhogo (Côte d’Ivoire) from 2018 to 2020 and the Identification of Their Potential Emission Sources. Environmental Science: Atmospheres, 3, 1741-1757. &gt;https://doi.org/10.1039/d3ea00131h
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref15">
    <label>15</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Silué, S., Kouassi, A.A., N’datchôh, E.T. and Yoboué, V. (2021) Meteorological Factors Contribution over Two Urban Sites in Côte d’Ivoire. RAMReS Science des Structure de la Matiere, 3, 12-39.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref16">
    <label>16</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Léon, J., Akpo, A.B., Bedou, M., Djossou, J., Bodjrenou, M., Yoboué, V., et al. (2021) Pm
     <sub>2.5</sub> Surface Concentrations in Southern West African Urban Areas Based on Sun Photometer and Satellite Observations. Atmospheric Chemistry and Physics, 21, 1815-1834. &gt;https://doi.org/10.5194/acp-21-1815-2021
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref17">
    <label>17</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Gnamien, S., Liousse, C., Keita, S., Kumar, R. and Yoboué, V. (2024) High-resolution Modeling of Air Quality in Abidjan (Côte d’Ivoire) Using a New Urban-Scale Inventory. Atmosphere, 15, Article 758. &gt;https://doi.org/10.3390/atmos15070758
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref18">
    <label>18</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     de Coëtlogon, G., Deroubaix, A., Flamant, C., Menut, L. and Gaetani, M. (2023) Impact of the Guinea Coast Upwelling on Atmospheric Dynamics, Precipitation and Pollutant Transport over Southern West Africa. Atmospheric Chemistry and Physics, 23, 15507-15521. &gt;https://doi.org/10.5194/acp-23-15507-2023
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref19">
    <label>19</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Flamant, C., Knippertz, P., Fink, A.H., Akpo, A., Brooks, B., Chiu, C.J., et al. (2018) The Dynamics-Aerosol-Chemistry-Cloud Interactions in West Africa Field Campaign: Overview and Research Highlights. Bulletin of the American Meteorological Society, 99, 83-104. &gt;https://doi.org/10.1175/bams-d-16-0256.1
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref20">
    <label>20</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Deroubaix, A., Menut, L., Flamant, C., Brito, J., Denjean, C., Dreiling, V., et al. (2019) Diurnal Cycle of Coastal Anthropogenic Pollutant Transport over Southern West Africa during the DACCIWA Campaign. Atmospheric Chemistry and Physics, 19, 473-497. &gt;https://doi.org/10.5194/acp-19-473-2019
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref21">
    <label>21</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Niamien, A.F., Léon, J., Adon, M., Rajot, J., Feron, A. and Yoboué, V. (2024) Variability of Aerosol Optical Depth and Altitude for Key Aerosol Types over Southern West Africa via CALIPSO/CALIOP Observations. Atmosphere, 15, Article 396. &gt;https://doi.org/10.3390/atmos15040396
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref22">
    <label>22</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Ossohou, M., Galy-Lacaux, C., Yoboué, V., Hickman, J.E., Gardrat, E., Adon, M., et al. (2019) Trends and Seasonal Variability of Atmospheric NO
     <sub>2</sub> and HNO
     <sub>3</sub> Concentrations across Three Major African Biomes Inferred from Long-Term Series of Ground-Based and Satellite Measurements. Atmospheric Environment, 207, 148-166. &gt;https://doi.org/10.1016/j.atmosenv.2019.03.027
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref23">
    <label>23</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Adon, M., Galy-Lacaux, C., Yoboué, V., Delon, C., Lacaux, J.P., Castera, P., et al. (2010) Long Term Measurements of Sulfur Dioxide, Nitrogen Dioxide, Ammonia, Nitric Acid and Ozone in Africa Using Passive Samplers. Atmospheric Chemistry and Physics, 10, 7467-7487. &gt;https://doi.org/10.5194/acp-10-7467-2010
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref24">
    <label>24</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Galy-Lacaux, C., Laouali, D., Descroix, L., Gobron, N. and Liousse, C. (2009) Long Term Precipitation Chemistry and Wet Deposition in a Remote Dry Savanna Site in Africa (Niger). Atmospheric Chemistry and Physics, 9, 1579-1595. &gt;https://doi.org/10.5194/acp-9-1579-2009
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref25">
    <label>25</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Galy-Lacaux, C. and Delon, C. (2014) Nitrogen Emission and Deposition Budget in West and Central Africa. Environmental Research Letters, 9, Article ID: 125002. &gt;https://doi.org/10.1088/1748-9326/9/12/125002
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref26">
    <label>26</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Yoboué, V., Galy-Lacaux, C., Lacaux, J.P. and Silué, S. (2005) Rainwater Chemistry and Wet Deposition over the Wet Savanna Ecosystem of Lamto (Côte d’Ivoire). Journal of Atmospheric Chemistry, 52, 117-141. &gt;https://doi.org/10.1007/s10874-005-0281-z
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref27">
    <label>27</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     World Health Organization (2021) WHO Global Air Quality Guidelines: Particulate Matter (PM
     <sub>2.5</sub> and PM
     <sub>10</sub>), Ozone, Nitrogen Dioxide, Sulfur Dioxide and Carbon Monoxide. World Health Organization.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref28">
    <label>28</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     United Nations Environment Programme (2023) Integrated Assessment of Air Pollution and Climate Change for Sustainable Development in Africa. 
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref29">
    <label>29</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Lelieveld, J., Evans, J.S., Fnais, M., Giannadaki, D. and Pozzer, A. (2015) The Contribution of Outdoor Air Pollution Sources to Premature Mortality on a Global Scale. Nature, 525, 367-371. &gt;https://doi.org/10.1038/nature15371
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref30">
    <label>30</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Burnett, R., Chen, H., Szyszkowicz, M., Fann, N., Hubbell, B., Pope, C.A., et al. (2018) Global Estimates of Mortality Associated with Long-Term Exposure to Outdoor Fine Particulate Matter. Proceedings of the National Academy of Sciences of the United States of America, 115, 9592-9597. &gt;https://doi.org/10.1073/pnas.1803222115
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref31">
    <label>31</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Garbagna, L., Babu Saheer, L. and Maktab Dar Oghaz, M. (2025) AI-Driven Approaches for Air Pollution Modelling: A Comprehensive Systematic Review. Environmental Pollution, 373, Article ID: 125937. &gt;https://doi.org/10.1016/j.envpol.2025.125937
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref32">
    <label>32</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Olawade, D.B., Wada, O.Z., Ige, A.O., Egbewole, B.I., Olojo, A. and Oladapo, B.I. (2024) Artificial Intelligence in Environmental Monitoring: Advancements, Challenges, and Future Directions. Hygiene and Environmental Health Advances, 12, Article ID: 100114. &gt;https://doi.org/10.1016/j.heha.2024.100114
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref33">
    <label>33</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Zheng, T., Bergin, M., Wang, G. and Carlson, D. (2021) Local PM
     <sub>2.5</sub> Hotspot Detector at 300 M Resolution: A Random Forest-Convolutional Neural Network Joint Model Jointly Trained on Satellite Images and Meteorology. Remote Sensing, 13, Article 1356. &gt;https://doi.org/10.3390/rs13071356
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref34">
    <label>34</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Dobrea, M., Badicu, A., Barbu, M., Subea, O., Balanescu, M., Suciu, G., et al. (2020) Machine Learning Algorithms for Air Pollutants Forecasting. 2020 IEEE 26th International Symposium for Design and Technology in Electronic Packaging (SIITME), Pitesti, 21-24 October 2020, 109-113. &gt;https://doi.org/10.1109/siitme50350.2020.9292238
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref35">
    <label>35</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Subramaniam, S., Raju, N., Ganesan, A., Rajavel, N., Chenniappan, M., Prakash, C., et al. (2022) Artificial Intelligence Technologies for Forecasting Air Pollution and Human Health: A Narrative Review. Sustainability, 14, Article 9951. &gt;https://doi.org/10.3390/su14169951
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref36">
    <label>36</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Fu, L., Li, J. and Chen, Y. (2023) An Innovative Decision Making Method for Air Quality Monitoring Based on Big Data-Assisted Artificial Intelligence Technique. Journal of Innovation &amp; Knowledge, 8, Article ID: 100294. &gt;https://doi.org/10.1016/j.jik.2022.100294
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref37">
    <label>37</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Le Roux, X., Abbadie, L., Lensi, R. and Serça, D. (1995) Emission of Nitrogen Monoxide from African Tropical Ecosystems: Control of Emission by Soil Characteristics in Humid and Dry Savannas of West Africa. Journal of Geophysical Research: Atmospheres, 100, 23133-23142. &gt;https://doi.org/10.1029/95jd01923
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref38">
    <label>38</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Le Roux, X., Gauthier, H., Bégué, A. and Sinoquet, H. (1997) Radiation Absorption and Use by Humid Savanna Grassland: Assessment Using Remote Sensing and Modelling. Agricultural and Forest Meteorology, 85, 117-132. &gt;https://doi.org/10.1016/s0168-1923(97)00002-6
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref39">
    <label>39</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Abbadie, L., Gignoux, J., Roux, X. and Lepage, M. (2006) Lamto: Structure, Functioning, and Dynamics of a Savanna Ecosystem (Vol. 179). Springer Science and Business Media.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref40">
    <label>40</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Ossohou, M., Galy-Lacaux, C., Yoboué, V., Adon, M., Delon, C., Gardrat, E., et al. (2020) Long-term Atmospheric Inorganic Nitrogen Deposition in West African Savanna over 16 Year Period (Lamto, Côte d’Ivoire). Environmental Research Letters, 16, Article ID: 015004. &gt;https://doi.org/10.1088/1748-9326/abd065
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref41">
    <label>41</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     N’Dri, A.B., Gignoux, J., Dembele, A. and Konate, S. (2012) Short Term Effects of Fire Intensity and Fire Regime on Vegetation Dynamic in a Tropical Humid Savanna (Lamto, Central Côte d’Ivoire). Natural Science, 4, 1056-1064. &gt;https://doi.org/10.4236/ns.2012.412134
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref42">
    <label>42</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     N Dri, A.B. and Konan, L.N. (2018) Does the Date of Burning Affect Carbon and Nutrient Losses in a Humid Savanna of West Africa? Environment and Natural Resources Research, 8, 102-116. &gt;https://doi.org/10.5539/enrr.v8n3p102
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref43">
    <label>43</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Tiemoko, D.T., Yoroba, F., Diawara, A., Kouadio, K., Kouassi, B.K. and Yapo, A.L.M. (2020) Understanding the Local Carbon Fluxes Variations and Their Relationship to Climate Conditions in a Sub-Humid Savannah-Ecosystem during 2008-2015: Case of Lamto in Cote d’Ivoire. Atmospheric and Climate Sciences, 10, 186-205. &gt;https://doi.org/10.4236/acs.2020.102010
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref44">
    <label>44</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Tiemoko, D.T., Yoroba, F., Paris, J., Diawara, A., Berchet, A., Pison, I., et al. (2020) Source-Receptor Relationships and Cluster Analysis of CO
     <sub>2</sub>, CH
     <sub>4</sub>, and CO Concentrations in West Africa: The Case of Lamto in Côte d’Ivoire. Atmosphere, 11, Article 903. &gt;https://doi.org/10.3390/atmos11090903
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref45">
    <label>45</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Bouet, C., Yoboué, V., Marticorena, B., Rajot, J.L., Allègre, M., Féron, A., Gaimoz, C., Maisonneuve, F., Siour, G., Valorso, R., Ki, A.F., Konaté, I. and Ouattara, A. (2021) PM10 Concentration, Lamto, Côte d’Ivoire. &gt;https://doi.org/10.25326/279 
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref46">
    <label>46</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Muñoz-Sabater, J., Dutra, E., Agustí-Panareda, A., Albergel, C., Arduini, G., Balsamo, G., et al. (2021) ERA5-Land: A State-of-the-Art Global Reanalysis Dataset for Land Applications. Earth System Science Data, 13, 4349-4383. &gt;https://doi.org/10.5194/essd-13-4349-2021
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref47">
    <label>47</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Seibert, P. (2000) Review and Intercomparison of Operational Methods for the Determination of the Mixing Height. Atmospheric Environment, 34, 1001-1027. &gt;https://doi.org/10.1016/s1352-2310(99)00349-0
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref48">
    <label>48</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Petäjä, T., Järvi, L., Kerminen, V., Ding, A.J., Sun, J.N., Nie, W., et al. (2016) Enhanced Air Pollution via Aerosol-Boundary Layer Feedback in China. Scientific Reports, 6, Article No. 18998. &gt;https://doi.org/10.1038/srep18998
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref49">
    <label>49</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Stull, R.B. (2015) Practical Meteorology: An Algebra-Based Survey of Atmospheric Science. University of British Columbia Press.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref50">
    <label>50</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Volná, V. and Hladký, D. (2020) Detailed Assessment of the Effects of Meteorological Conditions on PM10 Concentrations in the Northeastern Part of the Czech Republic. Atmosphere, 11, Article 497. &gt;https://doi.org/10.3390/atmos11050497
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref51">
    <label>51</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Breiman, L. (2001) Random Forests. Machine Learning, 45, 5-32. &gt;https://doi.org/10.1023/a:1010933404324
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref52">
    <label>52</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Géron, A. (2022) Hands-On Machine Learning with Scikit-Learn, Keras, and TensorFlow. O’Reilly Media, Inc.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref53">
    <label>53</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Bergmeir, C., Hyndman, R.J. and Koo, B. (2018) A Note on the Validity of Cross-Validation for Evaluating Autoregressive Time Series Prediction. Computational Statistics &amp; Data Analysis, 120, 70-83. &gt;https://doi.org/10.1016/j.csda.2017.11.003
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref54">
    <label>54</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Schafer, J.L. and Graham, J.W. (2002) Missing Data: Our View of the State of the Art. Psychological Methods, 7, 147-177. &gt;https://doi.org/10.1037/1082-989x.7.2.147
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref55">
    <label>55</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Bodjrènou, R., Sintondji, L.O., N’Tcha, Y.M.P., Germain, D., Azonwade, F.E., Sohindji, F., et al. (2024) Assessment of Hydrologic Data Estimates from ERA5 Reanalyses in Benin, West Africa. Geoscience Data Journal, 12, e288. &gt;https://doi.org/10.1002/gdj3.288
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref56">
    <label>56</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Humphreys, W.J. (1929) Physics of the Air. McGraw-Hill Book Company.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref57">
    <label>57</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Soro, T.D., Koné, M., N’Dri, A.B. and N’Datchoh, E.T. (2021) Identified Main Fire Hotspots and Seasons in Côte d’Ivoire (West Africa) Using MODIS Fire Data. South African Journal of Science, 117, Article No. 7659. &gt;https://doi.org/10.17159/sajs.2021/7659
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref58">
    <label>58</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     N’Datchoh, E.T., Konaré, A., Diedhiou, A., Diawara, A., Quansah, E. and Assamoi, P. (2015) Effects of Climate Variability on Savannah Fire Regimes in West Africa. Earth System Dynamics, 6, 161-174. &gt;https://doi.org/10.5194/esd-6-161-2015
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref59">
    <label>59</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Sultan, B. and Janicot, S. (2003) The West African Monsoon Dynamics. Part II: The “Preonset” and “Onset” of the Summer Monsoon. Journal of Climate, 16, 3407-3427. &gt;https://doi.org/10.1175/1520-0442(2003)016&lt;3407:twamdp&gt;2.0.co;2
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref60">
    <label>60</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Hyndman, R.J. and Athanasopoulos, G. (2018) Forecasting: Principles and Practice. OTexts.
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref61">
    <label>61</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Shumway, R.H. and Stoffer, D.S. (2017) ARIMA Models. In: Shumway, R.H. and Stoffer, D.S., Eds., Time Series Analysis and Its Applications, Springer, 75-163. &gt;https://doi.org/10.1007/978-3-319-52452-8_3
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref62">
    <label>62</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Chen, T. and Guestrin, C. (2016) XGBoost: A Scalable Tree Boosting System. Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, San Francisco, 13-17 August 2016, 785-794. &gt;https://doi.org/10.1145/2939672.2939785
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref63">
    <label>63</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Dickey, D.A. and Fuller, W.A. (1979) Distribution of the Estimators for Autoregressive Time Series with a Unit Root. Journal of the American Statistical Association, 74, 427-431. &gt;https://doi.org/10.1080/01621459.1979.10482531
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref64">
    <label>64</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Taşpınar, F. (2015) Improving Artificial Neural Network Model Predictions of Daily Average PM
     <sub>10</sub> Concentrations by Applying Principle Component Analysis and Implementing Seasonal Models. Journal of the Air &amp; Waste Management Association, 65, 800-809. &gt;https://doi.org/10.1080/10962247.2015.1019652
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref65">
    <label>65</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Weed, L., Lok, R., Chawra, D. and Zeitzer, J. (2022) The Impact of Missing Data and Imputation Methods on the Analysis of 24-Hour Activity Patterns. Clocks&amp;Sleep, 4, 497-507. 
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref66">
    <label>66</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Touré, N.E., Konaré, A. and Silué, S. (2012) Intercontinental Transport and Climatic Impact of Saharan and Sahelian Dust. Advances in Meteorology, 2012, Article ID: 157020. &gt;https://doi.org/10.1155/2012/157020
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref67">
    <label>67</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Arowosegbe, O.O., Röösli, M., Künzli, N., Saucy, A., Adebayo-Ojo, T.C., Jeebhay, M.F., et al. (2021) Comparing Methods to Impute Missing Daily Ground-Level PM
     <sub>10</sub> Concentrations between 2010-2017 in South Africa. International Journal of Environmental Research and Public Health, 18, Article 3374. &gt;https://doi.org/10.3390/ijerph18073374
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref68">
    <label>68</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Adnane, A., Leghrib, R., Chaoufi, J. and Chirmata, A. (2022) Prediction of PM10 Concentrations in the City of Agadir (Morocco) Using Non-Linear Autoregressive Artificial Neural Networks with Exogenous Inputs (NARX). Materials Today: Proceedings, 52, 146-151. &gt;https://doi.org/10.1016/j.matpr.2021.11.340
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref69">
    <label>69</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Bainomugisha, E., Adrine Warigo, P., Busigu Daka, F., Nshimye, A., Birungi, M. and Okure, D. (2024) AI-Driven Environmental Sensor Networks and Digital Platforms for Urban Air Pollution Monitoring and Modelling. Societal Impacts, 3, Article ID: 100044. &gt;https://doi.org/10.1016/j.socimp.2024.100044
    </mixed-citation>
   </ref>
   <ref id="scirp.146987-ref70">
    <label>70</label>
    <mixed-citation publication-type="other" xlink:type="simple">
     Sowunmi, A.O., Eze, O.I., Osadolor, U., Iseolorunkanmi, A. and Adeloye, D. (2024) Leveraging AI and Data Science to Mitigate the Respiratory Health Impacts of Climate Change in Africa: Organisation, Costs, and Challenges. Journal of Global Health, 14, Article ID: 03051. &gt;https://doi.org/10.7189/jogh.14.03051
    </mixed-citation>
   </ref>
  </ref-list>
 </back>
</article>