<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="research-article">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">SOIL</journal-id><journal-title-group>
    <journal-title>SOIL</journal-title>
    <abbrev-journal-title abbrev-type="publisher">SOIL</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">SOIL</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">2199-398X</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/soil-7-693-2021</article-id><title-group><article-title>The central African soil spectral library: <?xmltex \hack{\break}?>a new soil infrared repository and a <?xmltex \hack{\break}?>geographical prediction analysis</article-title><alt-title>The central African soil spectral library</alt-title>
      </title-group><?xmltex \runningtitle{The central African soil spectral library}?><?xmltex \runningauthor{L.~Summerauer et al.}?>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes" rid="aff1">
          <name><surname>Summerauer</surname><given-names>Laura</given-names></name>
          <email>laura.summerauer@usys.ethz.ch</email>
        <ext-link>https://orcid.org/0000-0002-3836-653X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Baumann</surname><given-names>Philipp</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-3194-8975</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Ramirez-Lopez</surname><given-names>Leonardo</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-5369-5120</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Barthel</surname><given-names>Matti</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3 aff4">
          <name><surname>Bauters</surname><given-names>Marijn</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5">
          <name><surname>Bukombe</surname><given-names>Benjamin</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-5135-9783</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5">
          <name><surname>Reichenbach</surname><given-names>Mario</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-4694-3579</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Boeckx</surname><given-names>Pascal</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4">
          <name><surname>Kearsley</surname><given-names>Elizabeth</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff6">
          <name><surname>Van Oost</surname><given-names>Kristof</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff7">
          <name><surname>Vanlauwe</surname><given-names>Bernard</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff8">
          <name><surname>Chiragaga</surname><given-names>Dieudonné</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff6">
          <name><surname>Heri-Kazi</surname><given-names>Aimé Bisimwa</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff9">
          <name><surname>Moonen</surname><given-names>Pieter</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff10">
          <name><surname>Sila</surname><given-names>Andrew</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff10">
          <name><surname>Shepherd</surname><given-names>Keith</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-7144-3915</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff11">
          <name><surname>Bazirake Mujinya</surname><given-names>Basile</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff12">
          <name><surname>Van Ranst</surname><given-names>Eric</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3">
          <name><surname>Baert</surname><given-names>Geert</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff5">
          <name><surname>Doetterl</surname><given-names>Sebastian</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-0986-891X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Six</surname><given-names>Johan</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-9336-4185</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>Department of Environmental Systems Science, ETH Zurich, Zurich Switzerland</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>Data Science Department, BUCHI Labortechnik AG, Flawil, Switzerland</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>Department of Green Chemistry and Technology, Ghent University, Ghent, Belgium</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>Department of Environment, Ghent University, Ghent, Belgium</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>Institute of Geography, University of Augsburg, Augsburg, Germany</institution>
        </aff>
        <aff id="aff6"><label>6</label><institution>Earth and Life Institute, UCLouvain, Louvain-la-Neuve, Belgium</institution>
        </aff>
        <aff id="aff7"><label>7</label><institution>International Institute of Tropical Agriculture, Nairobi, Kenya</institution>
        </aff>
        <aff id="aff8"><label>8</label><institution>International Institute of Tropical Agriculture, Bukavu, Democratic Republic of Congo</institution>
        </aff>
        <aff id="aff9"><label>9</label><institution>Department of Earth and Environmental Sciences, KU Leuven, Leuven, Belgium</institution>
        </aff>
        <aff id="aff10"><label>10</label><institution>World Agroforestry Centre, Nairobi, Kenya</institution>
        </aff>
        <aff id="aff11"><label>11</label><institution>Department of General Agricultural Sciences, University of Lubumbashi, Lubumbashi, <?xmltex \hack{\break}?>Democratic Republic of Congo</institution>
        </aff>
        <aff id="aff12"><label>12</label><institution>Department of Geology, Ghent University, Ghent, Belgium</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Laura Summerauer (laura.summerauer@usys.ethz.ch)</corresp></author-notes><pub-date><day>26</day><month>October</month><year>2021</year></pub-date>
      
      <volume>7</volume>
      <issue>2</issue>
      <fpage>693</fpage><lpage>715</lpage>
      <history>
        <date date-type="received"><day>18</day><month>December</month><year>2020</year></date>
           <date date-type="rev-request"><day>8</day><month>January</month><year>2021</year></date>
           <date date-type="rev-recd"><day>4</day><month>August</month><year>2021</year></date>
           <date date-type="accepted"><day>17</day><month>August</month><year>2021</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2021 Laura Summerauer et al.</copyright-statement>
        <copyright-year>2021</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021.html">This article is available from https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021.html</self-uri><self-uri xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021.pdf">The full text article is available as a PDF file from https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021.pdf</self-uri>
      <abstract><title>Abstract</title>
    <?pagebreak page694?><p id="d1e347">Information on soil properties is crucial for soil preservation, the improvement of food security, and the provision of ecosystem services. In particular, for the African continent, spatially explicit information on soils and their ability to sustain these services is still scarce. To address data gaps, infrared spectroscopy has achieved great success as a cost-effective solution to quantify soil properties in recent decades. Here, we present a mid-infrared soil spectral library (SSL) for central Africa (CSSL) that can predict key soil properties, allowing for future soil estimates with a minimal need for expensive and time-consuming  wet chemistry. Currently, our CSSL contains over 1800 soil samples from 10 distinct geoclimatic regions throughout the Congo Basin and along the Albertine Rift. For the analysis, we selected six regions from the CSSL, for which we built predictive models for total carbon (TC) and total nitrogen (TN) using an existing continental SSL (African Soil Information Service, AfSIS SSL; <inline-formula><mml:math id="M1" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1902</mml:mn></mml:mrow></mml:math></inline-formula>) that does not include central African soils. Using memory-based learning (MBL), we explored three different strategies at decreasing degrees of geographic extrapolation, using models built with (1) the AfSIS SSL only, (2) AfSIS SSL combined with the five remaining central African regions, and (3) a combination of AfSIS SSL, the remaining five regions, and selected samples from the target region (spiking). For this last strategy we introduce a method for spiking MBL models. We found that when using the AfSIS SSL only to predict the six central African regions, the root mean square error of the predictions (RMSE<inline-formula><mml:math id="M2" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) was between 3.85–8.74 and 0.40–1.66 <inline-formula><mml:math id="M3" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for TC and TN, respectively. The ratio of performance to the interquartile distance (RPIQ<inline-formula><mml:math id="M4" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) ranged between 0.96–3.95 for TC and 0.59–2.86 for TN. While the effect of the second strategy compared to the first strategy was mixed, the third strategy, spiking with samples from the target regions, could clearly reduce the RMSE<inline-formula><mml:math id="M5" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> to 3.19–7.32 <inline-formula><mml:math id="M6" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for TC and 0.24–0.89 <inline-formula><mml:math id="M7" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for TN. RPIQ<inline-formula><mml:math id="M8" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values were increased to ranges of 1.43–5.48 and 1.62–4.45 for TC and TN, respectively. In general, predicted TC and TN for soils of each of the six regions were accurate; the effect of spiking and avoiding geographical extrapolation was noticeably large. We conclude that our CSSL adds valuable soil diversity that can improve predictions for the Congo Basin region compared to using the continental AfSIS SSL alone; thus, analyses of other soils in central Africa will be able to profit from a more diverse spectral feature space. Given these promising results, the library comprises an important tool to facilitate economical soil analyses and predict soil properties in an understudied yet critical region of Africa. Our SSL is openly available for application and for enlargement with more spectral and reference data to further improve soil diagnostic accuracy and cost-effectiveness.</p>
  </abstract>
    </article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d1e459">Soil health is critical to crop nutrition, agricultural production, food security, erosion prevention, and climate change mitigation via carbon storage. Global climate change and soil degradation by deforestation and soil mismanagement critically threaten these soil ecosystem services <xref ref-type="bibr" rid="bib1.bibx16" id="paren.1"/>. In particular, the humid tropics are a front line for these anthropogenic impacts. For example, increasing temperatures and accelerating deforestation in the humid tropics are estimated to enhance greenhouse gas emissions <xref ref-type="bibr" rid="bib1.bibx24 bib1.bibx19" id="paren.2"/> but also to significantly reduce soil functions and ecosystem services such as plant nutrient supply, water storage and filtration capabilities, and erosion protection <xref ref-type="bibr" rid="bib1.bibx81" id="paren.3"/>. Despite the expected severity of these impacts, our understanding of the effects on soils in the humid tropics of Africa is limited by sparse data and uneven distribution of low-latitude research. Within the tropics, both the future impacts and data gaps are most severe in the Congo Basin, which contains the second largest tropical forest ecosystem on Earth, represents a considerable reservoir of soil carbon, and is critically endangered by fast deforestation <xref ref-type="bibr" rid="bib1.bibx32" id="paren.4"/>. Thereby, forest loss in central Africa is mainly driven by smallholder farmers practicing shifting cultivation <xref ref-type="bibr" rid="bib1.bibx77 bib1.bibx20" id="paren.5"/>  and cropland expansion to feed a fast-growing population. For example, the human population in Uganda, Rwanda, and the DRC is projected to more than double in the coming 80 years <xref ref-type="bibr" rid="bib1.bibx85" id="paren.6"/>. Such dramatic growth will likely contribute to further conversion of forest to agricultural land. As a result of these current and future impacts, more spatially explicit soil information is urgently needed in many research fields ranging from agricultural to soil biogeochemistry and climate sciences. In recent decades, improvements have been made carrying out soil surveys and creating soil databases and maps for central Africa <xref ref-type="bibr" rid="bib1.bibx29" id="paren.7"/>, for Rwanda <xref ref-type="bibr" rid="bib1.bibx34" id="paren.8"/>, and for the DRC <xref ref-type="bibr" rid="bib1.bibx4" id="paren.9"/>. Unfortunately, accessibility of such data is limited, and gaps are still large in central Africa <xref ref-type="bibr" rid="bib1.bibx80" id="paren.10"/>, in part due to the high cost of specialized equipment and chemicals for analyses, limited accessibility to sampling areas, and lack of infrastructure.</p>
      <p id="d1e493">Diffuse reflectance infrared Fourier transform (DRIFT) spectroscopy has gained attention as a cost-effective and rapid method for soil analyses <xref ref-type="bibr" rid="bib1.bibx53" id="paren.11"><named-content content-type="pre">e.g.,</named-content></xref>. Many soil minerals, as well as functional groups of soil organic matter, show distinct energy absorption features in the infrared (IR) region of the electromagnetic spectrum. These relationships can be empirically modeled to quantify soil properties relevant for soil quality, such as carbon (C), nitrogen (N), and other crop nutrients <xref ref-type="bibr" rid="bib1.bibx36 bib1.bibx71" id="paren.12"><named-content content-type="pre">e.g.,</named-content></xref>. Due to its simple handling, quick measurements, low costs, and minimal need for chemical consumables, IR spectroscopy is an important tool for soil analyses that further allows for high reproducibility and coverage of spatial soil heterogeneity. Especially in developing countries, where practices are often hampered by the prohibitive costs of conventional soil analyses, IR spectroscopy has great potential <xref ref-type="bibr" rid="bib1.bibx67 bib1.bibx60" id="paren.13"/>.</p>
      <p id="d1e509">Partial least squares (PLS) is a projection-based regression method which can be considered as the most widely used tool to calibrate models that translate spectral data into meaningful chemical and/or physical information. The method is especially useful in noncomplex contexts, where the relationships between spectra and response variables are essentially linear (e.g., spectral models developed for a small field where soil-forming factors are relatively constant). One of the main aims of establishing large-scale soil spectral libraries (SSLs) is to minimize the need for future wet chemical analyses <xref ref-type="bibr" rid="bib1.bibx73 bib1.bibx68 bib1.bibx83 bib1.bibx22" id="paren.14"><named-content content-type="pre">e.g.,</named-content></xref>. However, these libraries often span vast geographical areas that include different soil types and climate zones, which comprise complex soil organic carbon forms and mineral compositions. Due to this heterogeneity, predictions rendered by global linear regression models are often unfeasible for new local soil property assessments at a regional, field, or plot scale, especially when the new set covers a different geographical domain to the library. Despite the abundance of literature on<?pagebreak page695?> the calibration of quantitative models of soil properties using both mid-infrared (MIR) and near-infrared (NIR) data, there is still a lack of simple and efficient modeling strategies that could bring SSLs to an operational level. <xref ref-type="bibr" rid="bib1.bibx54" id="text.15"/> could considerably improve prediction accuracies for a new local set when using a compositionally related subset from a large-scale SSL, together with a small number of local reference analyses. Thus, a cost–accuracy trade-off can be met when the accuracy of the library-based prediction is similar to the one made when applying a local but more costly calibration strategy. Several data-driven methods have proven to be successful to overcome this issue, for example RS-LOCAL <xref ref-type="bibr" rid="bib1.bibx41" id="paren.16"/> and memory-based learning (a.k.a. local learning, e.g., <xref ref-type="bibr" rid="bib1.bibx50 bib1.bibx66 bib1.bibx57" id="altparen.17"/>). In addition, other promising approaches have also been proposed, although they require more research (e.g., deep learning, <xref ref-type="bibr" rid="bib1.bibx51" id="altparen.18"/>; fuzzy rule-based systems, <xref ref-type="bibr" rid="bib1.bibx76" id="altparen.19"/>). Memory-based learning (MBL), for example, searches for each new spectral observation, a subset of similar observations in a spectral library, which are then used to fit a custom predictive model for every new observation. This method has shown promising results when applied to extremely complex SSLs such as the MIR library of the United States <xref ref-type="bibr" rid="bib1.bibx21" id="paren.20"/> and in one developed for the European continent <xref ref-type="bibr" rid="bib1.bibx76" id="paren.21"/>. Spiking of libraries with samples from the target site has also shown to improve prediction accuracy <xref ref-type="bibr" rid="bib1.bibx30 bib1.bibx86 bib1.bibx64 bib1.bibx6" id="paren.22"><named-content content-type="pre">e.g.,</named-content></xref>. So far, SSLs have mainly been used for predictions of soil samples originating from the same geographical domain. Studies have shown that subsetting large-scale libraries for new spectra by their geographical zones can result in good prediction accuracy <xref ref-type="bibr" rid="bib1.bibx52 bib1.bibx69" id="paren.23"/>. These geographical restrictions could allow for extrapolation to new areas that contain similar soils.</p>
      <p id="d1e547">The aim of the present work was to propose three strategies that leverage the use of a large soil infrared spectral library to accurately predict soil properties in regions which are poorly covered by it. Furthermore, here we describe a convenient method for spiking MBL or local models. Here, we also present the first SSL for central Africa (CSSL), which can be used to enlarge the  existing continental library of African soils (a.k.a. African Soil Information Service, AfSIS). This effort represents an important first step towards fulfilling the need for spatially explicit and high-resolution soil data in an important yet understudied region in the humid tropics of Africa, promoting vital soil information that is critical to the future of the region.
<?xmltex \hack{\newpage}?></p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Methods</title>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Site descriptions</title>
      <p id="d1e566">Soil samples were collected from past projects in the Congo Basin and along the Albertine Rift, the western branch of the East African Rift System. Table <xref ref-type="table" rid="Ch1.T1"/> gives an overview of corresponding data sources and data contributors to the different sample sets and denotes the origin, the number of samples, and sampling layers used for our CSSL. The sample locations of the entire library are clustered over a large geographical area of central Africa, from a latitude of 2.8 to <inline-formula><mml:math id="M9" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>11.6<inline-formula><mml:math id="M10" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula> and a longitude of 12.9 to 30.4<inline-formula><mml:math id="M11" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>. From our entire library, six clustered regions were identified, which contained at least 80 samples to allow for reliable analysis. Therefore, this subset will be further presented in the paper (see Tables <xref ref-type="table" rid="App1.Ch1.S1.T4"/> and <xref ref-type="table" rid="App1.Ch1.S1.T5"/> in the Appendix for information on the entire library). Four of the selected regions are located in the Democratic Republic of the Congo (Haut-Katanga, South Kivu, Tshopo, Tshuapa), while the other two are located in Rwanda (Iburengerazuba) and in Uganda (Kabarole), respectively (Figs. <xref ref-type="fig" rid="Ch1.F1"/> and <xref ref-type="fig" rid="App1.Ch1.S1.F6"/>). Site-specific characteristics, coordinate ranges, altitudes, average climate, and dominant soil types are summarized in Table <xref ref-type="table" rid="Ch1.T2"/>. Annual precipitation ranges from about 1200 <inline-formula><mml:math id="M12" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">mm</mml:mi></mml:mrow></mml:math></inline-formula> in Haut-Katanga to over 2000 <inline-formula><mml:math id="M13" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">mm</mml:mi></mml:mrow></mml:math></inline-formula> in the tropical forest of Tshuapa. Mean annual temperature varies from 17.6 <inline-formula><mml:math id="M14" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C in the high altitudes of Iburengerazuba and South Kivu to 24.9 <inline-formula><mml:math id="M15" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C in Tshopo <xref ref-type="bibr" rid="bib1.bibx25" id="paren.24"/>. The study elevations range from 380 <inline-formula><mml:math id="M16" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">m</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mi mathvariant="normal">a</mml:mi><mml:mo>.</mml:mo><mml:mi mathvariant="normal">s</mml:mi><mml:mo>.</mml:mo><mml:mi mathvariant="normal">l</mml:mi><mml:mo>.</mml:mo></mml:mrow></mml:math></inline-formula> in Tshuapa and Tshopo to high altitudes of 2300 <inline-formula><mml:math id="M17" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">m</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:mi mathvariant="normal">a</mml:mi><mml:mo>.</mml:mo><mml:mi mathvariant="normal">s</mml:mi><mml:mo>.</mml:mo><mml:mi mathvariant="normal">l</mml:mi><mml:mo>.</mml:mo></mml:mrow></mml:math></inline-formula> in South Kivu along the rift valley <xref ref-type="bibr" rid="bib1.bibx37" id="paren.25"/>. Soil types are primarily Ferralsols, Acrisols, or Nitisols <xref ref-type="bibr" rid="bib1.bibx38 bib1.bibx35" id="paren.26"/>. The different regions contain multiple Köppen–Geiger climatic zones: The three regions located close to the Equator (Tshuapa, Tshopo, Kabarole) are classified as Af (tropical rainforest), while the eastern DRC and western Rwanda are classified as a mixture of climate zones Cfb (temperate, without dry season, warm summer), Csb (temperate, dry summer, warm summer), Aw (tropical savannah), and Cwb (temperate, dry winter, warm summer). The regions along the rift valley (South Kivu, Iburengerazuba, Kabarole) are  partially also classified as Am (tropical monsoon). Finally, the southeast of the DRC is classified  as Cwa (temperate, dry winter, hot summer) <xref ref-type="bibr" rid="bib1.bibx14" id="paren.27"/>.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F1" specific-use="star"><?xmltex \currentcnt{1}?><?xmltex \def\figurename{Figure}?><label>Figure 1</label><caption><p id="d1e699">Locations and spectra of soil samples from the central African spectral library (CSSL) and the continental soil spectral library from the African Soil Information Service (AfSIS SSL). The samples from the six regions from the CSSL further analyzed in this study are presented with a <inline-formula><mml:math id="M18" display="inline"><mml:mo>∘</mml:mo></mml:math></inline-formula> symbol, the remaining samples of CSSL with a <inline-formula><mml:math id="M19" display="inline"><mml:mi mathvariant="italic">▿</mml:mi></mml:math></inline-formula> symbol, and the AfSIS SSL with a <inline-formula><mml:math id="M20" display="inline"><mml:mi mathvariant="italic">□</mml:mi></mml:math></inline-formula> symbol. The average resampled spectrum of each library is shown (bold line), along with the individual resampled sample spectra (transparent lines). Base map of Africa created using Natural Earth.</p></caption>
          <?xmltex \igopts{width=497.923228pt}?><graphic xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021-f01.png"/>

        </fig>

<?xmltex \floatpos{p}?><table-wrap id="Ch1.T1" orientation="landscape"><?xmltex \currentcnt{1}?><label>Table 1</label><caption><p id="d1e732"> Soil sample archive used for the central African soil spectral library. The references show the publications from which the corresponding data were sourced. For previously unpublished data, the contributor institution is listed. The listed regions are provinces of the Democratic Republic of Congo (DRC) and Rwanda (RWA) and a district of Uganda (UGA).</p></caption><oasis:table frame="topbot"><?xmltex \begin{scaleboxenv}{.92}[.92]?><oasis:tgroup cols="4">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Data source or contributor</oasis:entry>
         <oasis:entry colname="col2">Region</oasis:entry>
         <oasis:entry colname="col3"><inline-formula><mml:math id="M21" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col4">Soil depth (cm)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx9 bib1.bibx10" id="text.28"/></oasis:entry>
         <oasis:entry colname="col2">Tshopo (DRC)</oasis:entry>
         <oasis:entry colname="col3">33</oasis:entry>
         <oasis:entry colname="col4">5–10</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx27" id="text.29"/>,   <xref ref-type="bibr" rid="bib1.bibx8" id="text.30"/></oasis:entry>
         <oasis:entry colname="col2">Tshopo, South Kivu (DRC)</oasis:entry>
         <oasis:entry colname="col3">38</oasis:entry>
         <oasis:entry colname="col4">0–5, 5–20, 0–15, 15–30</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Swiss Federal Institute of Technology Zurich</oasis:entry>
         <oasis:entry colname="col2">North Kivu, South Kivu, Équateur (DRC)</oasis:entry>
         <oasis:entry colname="col3">40</oasis:entry>
         <oasis:entry colname="col4">0–5, 5–20, 0–15, 15–30, 0–100 soil pit</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx39 bib1.bibx40" id="text.31"/></oasis:entry>
         <oasis:entry colname="col2">Tshopo (DRC)</oasis:entry>
         <oasis:entry colname="col3">40</oasis:entry>
         <oasis:entry colname="col4">0–10, 10–20, 20–30,  30–50, 50–100</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx11" id="text.32"/></oasis:entry>
         <oasis:entry colname="col2">Tshopo, South Kivu (DRC)</oasis:entry>
         <oasis:entry colname="col3">12</oasis:entry>
         <oasis:entry colname="col4">0–5</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx13" id="text.33"/>, <xref ref-type="bibr" rid="bib1.bibx43" id="text.34"/></oasis:entry>
         <oasis:entry colname="col2">Tshopo (DRC)</oasis:entry>
         <oasis:entry colname="col3">208</oasis:entry>
         <oasis:entry colname="col4">0–5, 5–10, 10–20</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx12" id="text.35"/></oasis:entry>
         <oasis:entry colname="col2">Tshuapa (DRC)</oasis:entry>
         <oasis:entry colname="col3">75</oasis:entry>
         <oasis:entry colname="col4">0–10, 10–20, 20–30, 30–50, 50–100</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx42" id="text.36"/></oasis:entry>
         <oasis:entry colname="col2">Tshuapa (DRC)</oasis:entry>
         <oasis:entry colname="col3">103</oasis:entry>
         <oasis:entry colname="col4">0–20</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx74" id="text.37"/></oasis:entry>
         <oasis:entry colname="col2">Tshuapa (DRC)</oasis:entry>
         <oasis:entry colname="col3">560</oasis:entry>
         <oasis:entry colname="col4">0–20, 20–50</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx33" id="text.38"/></oasis:entry>
         <oasis:entry colname="col2">South Kivu (DRC)</oasis:entry>
         <oasis:entry colname="col3">51</oasis:entry>
         <oasis:entry colname="col4">0–20</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Université Catholique de Louvain</oasis:entry>
         <oasis:entry colname="col2">South Kivu, Haut-Katanga (DRC)</oasis:entry>
         <oasis:entry colname="col3">46</oasis:entry>
         <oasis:entry colname="col4">0–20, 20–30</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx44 bib1.bibx45 bib1.bibx46 bib1.bibx47 bib1.bibx48" id="text.39"/></oasis:entry>
         <oasis:entry colname="col2">Haut-Katanga (DRC)</oasis:entry>
         <oasis:entry colname="col3">94</oasis:entry>
         <oasis:entry colname="col4">Termite mound profiles</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">International institute of Tropical Agriculture/World Agroforestry Centre</oasis:entry>
         <oasis:entry colname="col2">Bas-Uélé, South Kivu (DRC)</oasis:entry>
         <oasis:entry colname="col3">207</oasis:entry>
         <oasis:entry colname="col4">0–20, 20–40, 20–50</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx2 bib1.bibx3" id="text.40"/></oasis:entry>
         <oasis:entry colname="col2">Lower Congo and Central (DRC)</oasis:entry>
         <oasis:entry colname="col3">40</oasis:entry>
         <oasis:entry colname="col4">0–123 soil pit</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"><xref ref-type="bibr" rid="bib1.bibx23" id="text.41"/></oasis:entry>
         <oasis:entry colname="col2">South Kivu (DRC), Iburengerazuba (RWA), Kabarole (UGA)</oasis:entry>
         <oasis:entry colname="col3">307</oasis:entry>
         <oasis:entry colname="col4">0–10, 30–40, 60–70, 90–100</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup><?xmltex \end{scaleboxenv}?></oasis:table></table-wrap>

<?xmltex \floatpos{p}?><table-wrap id="Ch1.T2" orientation="landscape"><?xmltex \currentcnt{2}?><label>Table 2</label><caption><p id="d1e1024"> Number of samples, GPS coordinates, elevation, annual precipitation (AP), mean annual temperature (MAT), Köppen–Geiger climate classifications, and soil types for the sampled regions of the Democratic Republic of Congo, Rwanda, and Uganda. Data were extracted for all coordinates from raster files. Climate data are sourced from <xref ref-type="bibr" rid="bib1.bibx25" id="text.42"/>, elevation from SRTM (90 m resolution; <xref ref-type="bibr" rid="bib1.bibx37" id="altparen.43"/>), Köppen–Geiger climate classifications from <xref ref-type="bibr" rid="bib1.bibx14" id="text.44"/>, and soil types from the Soil Atlas of Africa <xref ref-type="bibr" rid="bib1.bibx38 bib1.bibx35" id="paren.45"/>.</p></caption><oasis:table frame="topbot"><?xmltex \begin{scaleboxenv}{.97}[.97]?><oasis:tgroup cols="9">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right"/>
     <oasis:colspec colnum="8" colname="col8" align="left"/>
     <oasis:colspec colnum="9" colname="col9" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Region</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M22" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Longitude (<inline-formula><mml:math id="M23" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col4">Latitude (<inline-formula><mml:math id="M24" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col5">Elevation (m)</oasis:entry>
         <oasis:entry colname="col6">MAT (<inline-formula><mml:math id="M25" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C)</oasis:entry>
         <oasis:entry colname="col7">AP (mm)</oasis:entry>
         <oasis:entry colname="col8">Köppen–Geiger</oasis:entry>
         <oasis:entry colname="col9">Soil types</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Haut-Katanga</oasis:entry>
         <oasis:entry colname="col2">119</oasis:entry>
         <oasis:entry colname="col3">27.48–27.85</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M26" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>11.61 to <inline-formula><mml:math id="M27" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>11.29</oasis:entry>
         <oasis:entry colname="col5">1197–1323</oasis:entry>
         <oasis:entry colname="col6">20.6</oasis:entry>
         <oasis:entry colname="col7">1223</oasis:entry>
         <oasis:entry colname="col8">Cwa</oasis:entry>
         <oasis:entry colname="col9">Rhodic/Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">South Kivu</oasis:entry>
         <oasis:entry colname="col2">369</oasis:entry>
         <oasis:entry colname="col3">28.64–28.91</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M28" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.79 to <inline-formula><mml:math id="M29" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.1</oasis:entry>
         <oasis:entry colname="col5">1487–2310</oasis:entry>
         <oasis:entry colname="col6">17.6</oasis:entry>
         <oasis:entry colname="col7">1627</oasis:entry>
         <oasis:entry colname="col8">Cfb, Csb, Aw, Cwb</oasis:entry>
         <oasis:entry colname="col9">Umbric Ferralsols, Haplic Acrisols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tshopo</oasis:entry>
         <oasis:entry colname="col2">315</oasis:entry>
         <oasis:entry colname="col3">24.48–25.32</oasis:entry>
         <oasis:entry colname="col4">0.29–0.83</oasis:entry>
         <oasis:entry colname="col5">380–506</oasis:entry>
         <oasis:entry colname="col6">24.9</oasis:entry>
         <oasis:entry colname="col7">1789</oasis:entry>
         <oasis:entry colname="col8">Af</oasis:entry>
         <oasis:entry colname="col9">Xanthic/Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tshuapa</oasis:entry>
         <oasis:entry colname="col2">738</oasis:entry>
         <oasis:entry colname="col3">21.84–22.53</oasis:entry>
         <oasis:entry colname="col4">0.28–0.8</oasis:entry>
         <oasis:entry colname="col5">385–578</oasis:entry>
         <oasis:entry colname="col6">24.7</oasis:entry>
         <oasis:entry colname="col7">2090</oasis:entry>
         <oasis:entry colname="col8">Af</oasis:entry>
         <oasis:entry colname="col9">Xanthic/Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Iburengerazuba</oasis:entry>
         <oasis:entry colname="col2">107</oasis:entry>
         <oasis:entry colname="col3">29.05–29.22</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M30" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.47 to <inline-formula><mml:math id="M31" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.34</oasis:entry>
         <oasis:entry colname="col5">1565–1939</oasis:entry>
         <oasis:entry colname="col6">17.6</oasis:entry>
         <oasis:entry colname="col7">1496</oasis:entry>
         <oasis:entry colname="col8">Csb, Aw, Cwb</oasis:entry>
         <oasis:entry colname="col9">Haplic/Umbric Acrisols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Kabarole</oasis:entry>
         <oasis:entry colname="col2">101</oasis:entry>
         <oasis:entry colname="col3">30.13–30.37</oasis:entry>
         <oasis:entry colname="col4">0.46–0.63</oasis:entry>
         <oasis:entry colname="col5">1271–1824</oasis:entry>
         <oasis:entry colname="col6">19.7</oasis:entry>
         <oasis:entry colname="col7">1360</oasis:entry>
         <oasis:entry colname="col8">Af, Cfb, Am</oasis:entry>
         <oasis:entry colname="col9">Haplic Phaeozems, Rhodic Nitisols, Albic Luvisols</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup><?xmltex \end{scaleboxenv}?></oasis:table></table-wrap>

</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>Laboratory soil analyses</title>
      <p id="d1e1367">In preparation for total carbon (TC) and total nitrogen (TN) analyses, all soil samples were sieved through a 2 <inline-formula><mml:math id="M32" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">mm</mml:mi></mml:mrow></mml:math></inline-formula> mesh and either air-dried or oven-dried at temperatures of 50 or 60 <inline-formula><mml:math id="M33" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C. After sieving and drying, soil samples were ground to a powder (<inline-formula><mml:math id="M34" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">50</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M35" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>m) using a ball mill. TC and TN were analyzed via dry combustion using either a LECO 628 elemental analyzer (LECO Corporation, USA), an ANCA-SL automated nitrogen carbon analyzer (SerCon, UK), or<?pagebreak page696?> a vario EL cube CNS elemental analyzer (Elementar, Germany). In order to ensure data quality and facilitate the harmonization of all TC and TN data, a subset of these samples was remeasured on the LECO. This performance comparison demonstrated high comparability of TC and TN data across all three instruments (<inline-formula><mml:math id="M36" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.99</mml:mn></mml:mrow></mml:math></inline-formula> for TC and TN, results not shown). The large majority of the soil samples originate from highly weathered and acidic soils and do not contain any carbonates, and therefore, TC contents correspond to total organic carbon contents. Only in a few samples from termite mounds in the subtropical Haut-Katanga province has calcium carbonate been detected where pH values are <inline-formula><mml:math id="M37" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula> <xref ref-type="bibr" rid="bib1.bibx44" id="paren.46"/>. Moreover, the widely used slash-and-burn practices could additionally have influenced soil TC contents, even when visible charcoal pieces were removed prior to any measurement. Additionally, soil pH (either in H<inline-formula><mml:math id="M38" display="inline"><mml:msub><mml:mi/><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:math></inline-formula>O, KCl or CaCl<inline-formula><mml:math id="M39" display="inline"><mml:msub><mml:mi/><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:math></inline-formula>, depending on the study), texture (laser diffraction particle size analyzer), and aqua-regia-extractable macro-/micronutrients (Al, Fe, Ca, Mg, Mn, Na, P, and K; inductively coupled plasma-optical emission spectroscopy) were analyzed for a subset of samples. The chemical and MIR prediction results for these soil characteristics are not presented in this paper but were carried out using the same methods and are available on our GitHub repository at <uri>https://doi.org/10.5281/zenodo.4351254</uri> (last access: 20 December 2020).</p>
</sec>
<sec id="Ch1.S2.SS3">
  <label>2.3</label><title>MIR spectral libraries</title>
<sec id="Ch1.S2.SS3.SSS1">
  <label>2.3.1</label><title>Central African spectral library</title>
      <p id="d1e1470">In order to determine the MIR reflectance, all ground soil samples were measured with a VERTEX70 Fourier transform IR (FT-IR) spectrometer with a high-throughput screening extension (HTS-XT) (Bruker Optics GmbH, Germany). Spectra were acquired at a resolution of 2 <inline-formula><mml:math id="M40" display="inline"><mml:mrow class="unit"><mml:msup><mml:mi mathvariant="normal">cm</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> within a range of 7500 to 600 <inline-formula><mml:math id="M41" display="inline"><mml:mrow class="unit"><mml:msup><mml:mi mathvariant="normal">cm</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, which corresponds to a wavelength range of 1333 to 16 667 <inline-formula><mml:math id="M42" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">nm</mml:mi></mml:mrow></mml:math></inline-formula>. A gold coated reflectance standard (Infragold NIR-MIR Reflectance Coating, Labsphere) was used as a background material for all measured soils in order to normalize the sample spectra. Reflectance was transformed into absorbance using log(1/reflectance) prior to further processing and subsequent modeling. Two replicates per sample were filled into the cups of a 24-well plate, and the surface was flattened without compression using a spatula. For each replicate, 32 co-added internal measurements were averaged and corrected for CO<inline-formula><mml:math id="M43" display="inline"><mml:msub><mml:mi/><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:math></inline-formula> and H<inline-formula><mml:math id="M44" display="inline"><mml:msub><mml:mi/><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:math></inline-formula>O using OPUS spectrometer software (Bruker Optics GmbH, Germany). This library is denoted as <inline-formula><mml:math id="M45" display="inline"><mml:mrow><mml:mi>C</mml:mi><mml:mo>=</mml:mo><mml:mo mathvariant="italic">{</mml:mo><mml:mi mathvariant="normal">Yc</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal">Xc</mml:mi><mml:msubsup><mml:mo mathvariant="italic">}</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mi>m</mml:mi></mml:msubsup></mml:mrow></mml:math></inline-formula> throughout the rest of the paper, where <inline-formula><mml:math id="M46" display="inline"><mml:mi mathvariant="normal">Yc</mml:mi></mml:math></inline-formula> is the matrix containing the two response variables (TC and TN), <inline-formula><mml:math id="M47" display="inline"><mml:mi mathvariant="normal">Xc</mml:mi></mml:math></inline-formula> is the matrix of spectra, and <inline-formula><mml:math id="M48" display="inline"><mml:mi>m</mml:mi></mml:math></inline-formula> is the total number of samples in the library.</p><?xmltex \hack{\newpage}?>
</sec>
<?pagebreak page698?><sec id="Ch1.S2.SS3.SSS2">
  <label>2.3.2</label><title>AfSIS spectral library</title>
      <p id="d1e1583">We used a MIR SSL created by the World Agroforestry Centre (ICRAF) to predict soil samples of the six selected regions of central Africa for their TC and TN contents. This SSL was created as part of the Africa Soil Information Service (AfSIS) in order to improve soil information and land management on the continental scale of sub-Saharan Africa <xref ref-type="bibr" rid="bib1.bibx79" id="paren.47"/>. For this continental library (see Fig. <xref ref-type="fig" rid="Ch1.F1"/>), reference values for TC and TN were measured using a ThermoQuest EA 1112 elemental analyzer. The MIR spectra of the samples were obtained by scanning them on a Tensor27 FT-IR spectrometer (Bruker Optics GmbH, Germany) with a high-throughput screening extension. Soil samples were measured in a wavenumber range of 4000 to 600 <inline-formula><mml:math id="M49" display="inline"><mml:mrow class="unit"><mml:msup><mml:mi mathvariant="normal">cm</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> (2500 to 16 666 <inline-formula><mml:math id="M50" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">nm</mml:mi></mml:mrow></mml:math></inline-formula>) with a spectral resolution of 2 <inline-formula><mml:math id="M51" display="inline"><mml:mrow class="unit"><mml:msup><mml:mi mathvariant="normal">cm</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. Four replicates per sample were measured, and an average of 32 co-added scans were used for each sample <xref ref-type="bibr" rid="bib1.bibx70" id="paren.48"/>. Here we denote this library as <inline-formula><mml:math id="M52" display="inline"><mml:mrow><mml:mi>A</mml:mi><mml:mo>=</mml:mo><mml:mo mathvariant="italic">{</mml:mo><mml:mi mathvariant="normal">Ya</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal">Xa</mml:mi><mml:msubsup><mml:mo mathvariant="italic">}</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mi>n</mml:mi></mml:msubsup></mml:mrow></mml:math></inline-formula> throughout the rest of the paper, where for all its samples (<inline-formula><mml:math id="M53" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula>), <inline-formula><mml:math id="M54" display="inline"><mml:mi mathvariant="normal">Ya</mml:mi></mml:math></inline-formula> represents the matrix containing the two response variables (TC and TN), and <inline-formula><mml:math id="M55" display="inline"><mml:mi mathvariant="normal">Xa</mml:mi></mml:math></inline-formula> represents the matrix of spectra.</p>
</sec>
</sec>
<sec id="Ch1.S2.SS4">
  <label>2.4</label><title>Spectral resampling and preprocessing</title>
      <p id="d1e1686">All CSSL and AfSIS spectra were processed using the R packages “prospectr” <xref ref-type="bibr" rid="bib1.bibx72" id="paren.49"/>, “simplerspec” <xref ref-type="bibr" rid="bib1.bibx7" id="paren.50"/>, and “resemble” <xref ref-type="bibr" rid="bib1.bibx56" id="paren.51"/> in the R statistical computing environment <xref ref-type="bibr" rid="bib1.bibx55" id="paren.52"/>. Replicates of spectral measurements were aggregated to one average spectrum per sample. The spectra were then resampled to a resolution of 16 cm<inline-formula><mml:math id="M56" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula> and trimmed to a spectral range of 4000–600 cm<inline-formula><mml:math id="M57" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula>. Both spectral libraries were scanned on two FT-IR Bruker spectrometers (Bruker Optics GmbH, Germany), which use the same settings and the same internal standards. The scanning methods of the CSSL were adapted to the standard operating procedures of the Soil Plant Spectral Diagnostics Laboratory at ICRAF. For these reasons, no instrument standardization was necessary.</p>
      <p id="d1e1726">As spectral pretreatments have a marked impact on the performance of quantitative infrared models <xref ref-type="bibr" rid="bib1.bibx61 bib1.bibx65" id="paren.53"/>, the preprocessing procedure was specifically optimized for the MIR spectra of the central African samples. This procedure was based on the PLS method <xref ref-type="bibr" rid="bib1.bibx89" id="paren.54"/>, which is also known as projection to latent structures and is widely used for regression analysis in infrared spectroscopy. However, it is also useful for projecting the spectral data onto a low-dimensional (and therefore less complex) subspace containing all the meaningful information of the original data. The projection model can be expressed as
            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M58" display="block"><mml:mrow><mml:mi mathvariant="bold">X</mml:mi><mml:mo>=</mml:mo><mml:msup><mml:mi mathvariant="bold">SP</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>+</mml:mo><mml:mi>E</mml:mi><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M59" display="inline"><mml:mi mathvariant="bold">X</mml:mi></mml:math></inline-formula> is the original spectral matrix of <inline-formula><mml:math id="M60" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>×</mml:mo><mml:mi>d</mml:mi></mml:mrow></mml:math></inline-formula> dimensions, <inline-formula><mml:math id="M61" display="inline"><mml:mi mathvariant="bold">S</mml:mi></mml:math></inline-formula> is the PLS score matrix of <inline-formula><mml:math id="M62" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>×</mml:mo><mml:mi>l</mml:mi></mml:mrow></mml:math></inline-formula> dimensions (where <inline-formula><mml:math id="M63" display="inline"><mml:mrow><mml:mi>l</mml:mi><mml:mo>≤</mml:mo><mml:mo>min⁡</mml:mo><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>,</mml:mo><mml:mi>d</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>) which contains the extracted variables, and <inline-formula><mml:math id="M64" display="inline"><mml:mi mathvariant="bold">P</mml:mi></mml:math></inline-formula> is the matrix of loadings of <inline-formula><mml:math id="M65" display="inline"><mml:mrow><mml:mi>d</mml:mi><mml:mo>×</mml:mo><mml:mi>l</mml:mi></mml:mrow></mml:math></inline-formula> dimensions which captures the spectral variability across observations. <inline-formula><mml:math id="M66" display="inline"><mml:mi>E</mml:mi></mml:math></inline-formula> is an error term. For spectral data with high collinearity, the optimal <inline-formula><mml:math id="M67" display="inline"><mml:mi>l</mml:mi></mml:math></inline-formula> (or the number of PLS factors) is usually small, which means that only a few PLS factors or latent variables are enough to properly represent the original variability of <inline-formula><mml:math id="M68" display="inline"><mml:mi mathvariant="bold">X</mml:mi></mml:math></inline-formula>. An important aspect of this type of projection is that it is obtained in such a way that the covariance between <inline-formula><mml:math id="M69" display="inline"><mml:mi mathvariant="bold">S</mml:mi></mml:math></inline-formula> and an external set of one or more variables is maximized. For a detailed description on PLS we refer the reader to <xref ref-type="bibr" rid="bib1.bibx90" id="text.55"/>. In PLS, <inline-formula><mml:math id="M70" display="inline"><mml:mi mathvariant="bold">P</mml:mi></mml:math></inline-formula> can be used on new spectral observations to project them onto the lower dimensional subspace:
            <disp-formula id="Ch1.E2" content-type="numbered"><label>2</label><mml:math id="M71" display="block"><mml:mrow><mml:msub><mml:mi mathvariant="bold">S</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:msup><mml:mi mathvariant="bold">P</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e1902">The spectral reconstruction residuals of the projection model can then be computed by back-transforming the matrix of scores to a spectral matrix and comparing it against the original spectral matrix as follows:
            <disp-formula id="Ch1.E3" content-type="numbered"><label>3</label><mml:math id="M72" display="block"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="bold">S</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:msup><mml:mi mathvariant="bold">P</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e1936">Finally, the spectral reconstruction error (also known as the <inline-formula><mml:math id="M73" display="inline"><mml:mi>Q</mml:mi></mml:math></inline-formula> statistic) is computed as the sum of squares of <inline-formula><mml:math id="M74" display="inline"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mtext>new</mml:mtext></mml:msub></mml:mrow></mml:math></inline-formula>:
            <disp-formula id="Ch1.E4" content-type="numbered"><label>4</label><mml:math id="M75" display="block"><mml:mrow><mml:msub><mml:mi>Q</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>E</mml:mi><mml:mtext>new</mml:mtext></mml:msub><mml:msub><mml:msup><mml:mi>E</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mtext>new</mml:mtext></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e1985">The <inline-formula><mml:math id="M76" display="inline"><mml:mi>Q</mml:mi></mml:math></inline-formula> statistic indicates how well a given new sample is represented by the PLS model <xref ref-type="bibr" rid="bib1.bibx87 bib1.bibx5" id="paren.56"/>. This statistic is widely used in chemometrics for outlier identification and uncertainty assessment <xref ref-type="bibr" rid="bib1.bibx88" id="paren.57"/>.</p>
      <?pagebreak page699?><p id="d1e2001">In summary, our approach offers a data-driven solution to the selection of the spectral preprocessing steps which are optimized for the target/prediction set. The optimal set of steps is defined as the one that minimizes the <inline-formula><mml:math id="M77" display="inline"><mml:mi>Q</mml:mi></mml:math></inline-formula> statistic. This approach does not require prior knowledge of the response values of the target set and therefore is well suited for preprocessing optimization. It assumes that PLS models that cannot account for the spectral variability in the target set may also fail at producing accurate predictions of the response variable. In other words, as suggested by <xref ref-type="bibr" rid="bib1.bibx88" id="text.58"/>, large <inline-formula><mml:math id="M78" display="inline"><mml:mi>Q</mml:mi></mml:math></inline-formula> values can be used as proxies for large prediction errors, and therefore <inline-formula><mml:math id="M79" display="inline"><mml:mi>Q</mml:mi></mml:math></inline-formula> values can be used to judge the suitability of a set of preprocessing steps.
To find an optimal combination of spectral pretreatments, we defined a set of different pretreatments <inline-formula><mml:math id="M80" display="inline"><mml:mrow><mml:mo mathvariant="italic">{</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mn mathvariant="normal">1</mml:mn></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mo>,</mml:mo><mml:mi mathvariant="normal">…</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mi>z</mml:mi></mml:msub><mml:mo mathvariant="italic">}</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula><mml:math id="M81" display="inline"><mml:mrow><mml:msub><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> represents one pretreatment or a sequence of pretreatments (with unique parameter values) to be applied on the spectral data. For this purpose, a projection model was built with the AfSIS spectra (using TC and TN as external variables) for each combination of spectral pretreatments:
            <disp-formula id="Ch1.E5" content-type="numbered"><label>5</label><mml:math id="M82" display="block"><mml:mrow><mml:msub><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Xa</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mi mathvariant="normal">Sa</mml:mi><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:msup><mml:mi mathvariant="normal">Pa</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>
          This model was then used on the CSSL pretreated spectra with reconstruction residuals (<inline-formula><mml:math id="M83" display="inline"><mml:mi mathvariant="normal">Ec</mml:mi></mml:math></inline-formula>) computed as follows:
            <disp-formula id="Ch1.E6" content-type="numbered"><label>6</label><mml:math id="M84" display="block"><mml:mrow><mml:mi mathvariant="normal">Ec</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Xc</mml:mi><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:mo>[</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Xc</mml:mi><mml:mo>)</mml:mo><mml:msup><mml:mi mathvariant="normal">Pa</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup><mml:msup><mml:mi mathvariant="normal">ScPa</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:mo>]</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M85" display="inline"><mml:mi mathvariant="normal">Pa</mml:mi></mml:math></inline-formula> denotes the loadings corresponding to the PLS model built with the AfSIS library and <inline-formula><mml:math id="M86" display="inline"><mml:mi mathvariant="normal">Sc</mml:mi></mml:math></inline-formula> the projected scores of the central African Library.</p>
      <p id="d1e2195">For this analysis we fixed the number of PLS factors to 20 because projected variables beyond this dimension did not capture a sufficient amount of the original spectral variance. For example, PLS variable 21 amounted to less than 0.01 <inline-formula><mml:math id="M87" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">%</mml:mi></mml:mrow></mml:math></inline-formula> of the original variance in all the cases. The mean <inline-formula><mml:math id="M88" display="inline"><mml:mi>Q</mml:mi></mml:math></inline-formula> value (<inline-formula><mml:math id="M89" display="inline"><mml:mover accent="true"><mml:mi>Q</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:math></inline-formula>) for the <inline-formula><mml:math id="M90" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>th set of pretreatments was obtained by
            <disp-formula id="Ch1.E7" content-type="numbered"><label>7</label><mml:math id="M91" display="block"><mml:mrow><mml:mover accent="true"><mml:mi>Q</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mrow><mml:mi>m</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi>d</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msub><mml:mtext>Ec</mml:mtext><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mtext>Ec</mml:mtext><mml:mi>j</mml:mi><mml:mo>′</mml:mo></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M92" display="inline"><mml:mi>m</mml:mi></mml:math></inline-formula>  and <inline-formula><mml:math id="M93" display="inline"><mml:mi>d</mml:mi></mml:math></inline-formula> are the number of samples and the number of spectral variables in the CSSL respectively. To allow for comparisons across the reconstruction errors obtained for the different pretreatments, <inline-formula><mml:math id="M94" display="inline"><mml:mover accent="true"><mml:mi>Q</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:math></inline-formula> was standardized as follows:
            <disp-formula id="Ch1.E8" content-type="numbered"><label>8</label><mml:math id="M95" display="block"><mml:mrow><mml:mi>s</mml:mi><mml:mover accent="true"><mml:mi>Q</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mover accent="true"><mml:mi>Q</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mtext>max</mml:mtext><mml:mo>(</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Xc</mml:mi><mml:mo>)</mml:mo><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:mtext>min</mml:mtext><mml:mo>(</mml:mo><mml:msub><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi mathvariant="normal">Xc</mml:mi><mml:mo>)</mml:mo><mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e2384">Tested pretreatments included different combinations of standard normal variate, multiplicative scatter correction, spectral detrending, first and second derivatives, and window sizes from 3 to 35 points in increments of 2. Minimal spectral reconstruction error was achieved with a Savitzky–Golay filter with a second-order derivative using a second-order polynomial approximation with a window size of 17 cm<inline-formula><mml:math id="M96" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula> <xref ref-type="bibr" rid="bib1.bibx63" id="paren.59"/>, and a subsequent multiplicative scatter correction. This pretreatment was then applied to the spectra prior to MBL.</p>
</sec>
<sec id="Ch1.S2.SS5">
  <label>2.5</label><title>Principal component analysis data visualization</title>
      <p id="d1e2411">To analyze the difference between the two spectral libraries and to visualize the similarities between soil samples, a principal component analysis (PCA) was conducted on the preprocessed spectra of both libraries. The PCA was performed with centering but without scaling of the absorbance values.</p>
</sec>
<sec id="Ch1.S2.SS6">
  <label>2.6</label><title>Modeling approach</title>
      <p id="d1e2422">In the following we describe the method we used to assess the performance of MBL for predicting TC and TN for six distinct regions at different scenarios of regional soil extrapolation. Three specific modeling strategies were tested on the selected regional sets which we call validation sets (see Sect. <xref ref-type="sec" rid="Ch1.S2.SS6.SSS2"/>). With the regional analysis we demonstrate how predictions of soil properties within new sites from distinct regions – which are compositionally less variable than the available SSLs – perform and profit from knowledge present in the AfSIS SSL. The analysis also demonstrates the added value of our new CSSL in addition to the AfSIS SSL alone. Doing so, the aims of the modeling scenarios were (1) to minimize the costs and time for traditional methods by optimizing the transfer of stored spectral information to the new region of interest and (2) to test different levels of geographical extrapolations for new regions, when no chemical analyses of local samples are available.</p>
<sec id="Ch1.S2.SS6.SSS1">
  <label>2.6.1</label><title>Modeling and prediction data</title>
      <p id="d1e2434">We used two main data sources and subsets as follows:
<list list-type="order"><list-item>
      <p id="d1e2439"><italic>The AfSIS data set</italic> (<inline-formula><mml:math id="M97" display="inline"><mml:mi mathvariant="normal">A</mml:mi></mml:math></inline-formula>). The continental SSL from sub-Saharan Africa includes 1902 soil samples with both MIR spectra data and analytical reference data (Fig. <xref ref-type="fig" rid="Ch1.F1"/>).</p></list-item><list-item>
      <p id="d1e2454"><italic>The central African data set</italic> (<inline-formula><mml:math id="M98" display="inline"><mml:mi mathvariant="script">C</mml:mi></mml:math></inline-formula>). The central African set comprises a total of 1578 soil samples which originate from six regions (<inline-formula><mml:math id="M99" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), namely Haut-Katanga (119 samples), South Kivu (367 samples), Tshopo (134 samples), Tshuapa (738 samples), Iburengerazuba (104 samples), and Kabarole (100 samples), after the removal of one outlier sample from South Kivu with a large Mahalanobis distance to the AfSIS SSL and therefore high prediction uncertainties (distance <inline-formula><mml:math id="M100" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:math></inline-formula>; results not shown). Each regional set was split up into a regional validation set (<inline-formula><mml:math id="M101" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M102" display="inline"><mml:mo>\</mml:mo></mml:math></inline-formula> <inline-formula><mml:math id="M103" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) and a spiking set (<inline-formula><mml:math id="M104" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>). For this work we differentiated between three different subsets which are defined as follows:
<list list-type="alpha-lower"><list-item>
      <p id="d1e2530">the union of the six regional subsets <inline-formula><mml:math id="M105" display="inline"><mml:mi mathvariant="script">C</mml:mi></mml:math></inline-formula>:<disp-formula id="Ch1.E9" content-type="numbered"><label>9</label><mml:math id="M106" display="block"><mml:mrow><mml:mi mathvariant="script">C</mml:mi><mml:mo>=</mml:mo><mml:munderover><mml:mo movablelimits="false">⋃</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mn mathvariant="normal">6</mml:mn></mml:munderover><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>;</mml:mo></mml:mrow></mml:math></disp-formula></p></list-item><list-item>
      <p id="d1e2564">regional validation subsets, which are the regional sets without the spiking  samples <inline-formula><mml:math id="M107" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M108" display="inline"><mml:mo>\</mml:mo></mml:math></inline-formula> <inline-formula><mml:math id="M109" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>;</p></list-item><list-item>
      <p id="d1e2597">six representative regional spiking subsets <inline-formula><mml:math id="M110" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, which were selected from each regional set <inline-formula><mml:math id="M111" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, using the <inline-formula><mml:math id="M112" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means sampling method, which selects one sample per cluster calculated on a principal component analysis as described in <xref ref-type="bibr" rid="bib1.bibx49" id="text.60"/> (for examples on <inline-formula><mml:math id="M113" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means sampling in soil spectroscopy, we refer the reader to <xref ref-type="bibr" rid="bib1.bibx59 bib1.bibx84 bib1.bibx82" id="text.61"/>); a size of 20 samples per region was selected to show a pronounced effect of spiking that avoided any geographical extrapolation.</p></list-item></list></p></list-item></list></p>
</sec>
<sec id="Ch1.S2.SS6.SSS2">
  <label>2.6.2</label><title>Modeling strategies</title>
      <p id="d1e2651">Three different scenarios were compared which are related to the degree of the geographical extrapolation:
<list list-type="bullet"><list-item>
      <p id="d1e2656"><italic>Strategy 1</italic>. MBL predictions for the regional validation subsets (<inline-formula><mml:math id="M114" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>\</mml:mo><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) were computed from models built only with <inline-formula><mml:math id="M115" display="inline"><mml:mi mathvariant="normal">A</mml:mi></mml:math></inline-formula>. This scenario represents an extreme case of extrapolation (from the geographical perspective) because no samples from the entire central African area are present in the AfSIS set (Fig. <xref ref-type="fig" rid="Ch1.F1"/>), which is the only data used to build the predictive models.</p></list-item><list-item>
      <p id="d1e2689"><italic>Strategy 2</italic>. Predictions for every <inline-formula><mml:math id="M116" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>\</mml:mo><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are computed using MBL models built from the pooled AfSIS data <inline-formula><mml:math id="M117" display="inline"><mml:mi mathvariant="normal">A</mml:mi></mml:math></inline-formula> together with the data from the remaining five regions <inline-formula><mml:math id="M118" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="script">C</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, i.e., <inline-formula><mml:math id="M119" display="inline"><mml:mrow><mml:mi mathvariant="normal">A</mml:mi><mml:mo>∪</mml:mo><mml:msub><mml:mi mathvariant="script">C</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>, where</p>
      <p id="d1e2745"><disp-formula id="Ch1.E10" content-type="numbered"><label>10</label><mml:math id="M120" display="block"><mml:mrow><mml:msub><mml:mi mathvariant="script">C</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:munderover><mml:mo movablelimits="false">⋃</mml:mo><mml:mstyle scriptlevel="+1"><mml:mtable class="substack"><mml:mtr><mml:mtd><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mi>j</mml:mi><mml:mo>∉</mml:mo><mml:mi>i</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:mstyle><mml:mn mathvariant="normal">6</mml:mn></mml:munderover><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>\</mml:mo><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e2796">Strategy 2 evokes less pronounced geographical extrapolation than strategy 1.</p></list-item><list-item>
      <p id="d1e2800"><italic>Strategy 3</italic>. This time, strategy 2 was repeated, but extrapolation was avoided using the spiking samples from the same geographical region. Each regional set <inline-formula><mml:math id="M121" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">G</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>\</mml:mo><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was predicted by the pooled AfSIS data, the data of the remaining regions, and the respective spiking set, i.e., <inline-formula><mml:math id="M122" display="inline"><mml:mrow><mml:mi mathvariant="normal">A</mml:mi><mml:mo>∪</mml:mo><mml:msub><mml:mi mathvariant="script">C</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>∪</mml:mo><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>.</p></list-item></list></p>
</sec>
</sec>
<?pagebreak page700?><sec id="Ch1.S2.SS7">
  <label>2.7</label><title>Predictive modeling</title>
      <p id="d1e2854">We used MBL as our predictive modeling approach. In the chemometrics literature, MBL is also known as local modeling, which describes a family of (nonlinear) machine learning methods designed to handle complex spectral data sets <xref ref-type="bibr" rid="bib1.bibx58" id="paren.62"/>. This type of learning method does not attempt to fit a general (global) predictive function using all available data. Instead, a new and unique function (<inline-formula><mml:math id="M123" display="inline"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) is built on demand, every time a new prediction for a given response variable is required. This new function is built using only a subset of relevant observations from a reference set that are queried through a <inline-formula><mml:math id="M124" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-nearest neighbor search. The MBL method implemented for this study uses a spectral nearest neighbor search based on a moving window correlation dissimilarity. To measure the dissimilarity (<inline-formula><mml:math id="M125" display="inline"><mml:mi>r</mml:mi></mml:math></inline-formula>) between two spectra (<inline-formula><mml:math id="M126" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M127" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>), the following equation was used:
            <disp-formula id="Ch1.E11" content-type="numbered"><label>11</label><mml:math id="M128" display="block"><mml:mrow><mml:mi>r</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>;</mml:mo><mml:mi>w</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>w</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mo>-</mml:mo><mml:mi>w</mml:mi></mml:mrow></mml:munderover><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:mi mathvariant="italic">ρ</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mo mathvariant="italic">{</mml:mo><mml:mi>k</mml:mi><mml:mo>:</mml:mo><mml:mi>k</mml:mi><mml:mo>+</mml:mo><mml:mi>w</mml:mi><mml:mo mathvariant="italic">}</mml:mo></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mo>,</mml:mo><mml:mo mathvariant="italic">{</mml:mo><mml:mi>k</mml:mi><mml:mo>:</mml:mo><mml:mi>k</mml:mi><mml:mo>+</mml:mo><mml:mi>w</mml:mi><mml:mo mathvariant="italic">}</mml:mo></mml:mrow></mml:msub><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M129" display="inline"><mml:mi>d</mml:mi></mml:math></inline-formula> is the number of spectral variables, <inline-formula><mml:math id="M130" display="inline"><mml:mi mathvariant="italic">ρ</mml:mi></mml:math></inline-formula> represents the Pearson's correlation function, and <inline-formula><mml:math id="M131" display="inline"><mml:mi>w</mml:mi></mml:math></inline-formula> is the size of a moving window. This window size was optimized based on a spectral nearest-neighbor search within the AfSIS library. For every sample in the AfSIS library, its closest sample (in the spectral space) was identified. Then, samples were compared against their closest neighbors in terms of TC and TN and root mean squared differences (RMSDs), computed according to the following equations:
            <disp-formula id="Ch1.E12" content-type="numbered"><label>12</label><mml:math id="M132" display="block"><mml:mrow><mml:mi>j</mml:mi><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mtext>NN</mml:mtext><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">xa</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msup><mml:mi mathvariant="normal">Xa</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msup><mml:mo>)</mml:mo></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e3083"><disp-formula id="Ch1.E13" content-type="numbered"><label>13</label><mml:math id="M133" display="block"><mml:mrow><mml:mtext>RMSD</mml:mtext><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>m</mml:mi></mml:mrow></mml:mfrac></mml:mstyle><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>h</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mn mathvariant="normal">2</mml:mn></mml:munderover><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">ya</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="normal">ya</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mo>(</mml:mo><mml:mi>i</mml:mi><mml:mo>)</mml:mo><mml:mo>,</mml:mo><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:msqrt><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where NN<inline-formula><mml:math id="M134" display="inline"><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">xa</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msup><mml:mi mathvariant="normal">Xa</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msup><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula> represents a function to obtain the index of the nearest neighbor of the <inline-formula><mml:math id="M135" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>th observation found in Xa (excluding the <inline-formula><mml:math id="M136" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>th observation), and <inline-formula><mml:math id="M137" display="inline"><mml:mrow><mml:mi>y</mml:mi><mml:msub><mml:mi>c</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the value of the <inline-formula><mml:math id="M138" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>th observation for the <inline-formula><mml:math id="M139" display="inline"><mml:mi>h</mml:mi></mml:math></inline-formula>th property variable (either TC or TN). In total 10 window sizes were evaluated using this approach (from 31 up to 121 in steps of 10), and according to the RMSD, an optimal window size <inline-formula><mml:math id="M140" display="inline"><mml:mi>w</mml:mi></mml:math></inline-formula> of 71 was chosen.</p>
      <p id="d1e3246">After nearest neighbor retrieval, our MBL method fits a local model using the weighted average partial least squares (WA-PLS) regression algorithm proposed by <xref ref-type="bibr" rid="bib1.bibx66" id="text.63"/>. In this WA-PLS, the final prediction is a weighted average of multiple predictions generated by PLS models built from different PLS factors. A range of latent variables from 5 to 30 in increments of 1 was used for the WA-PLS calculations. The weight for each component is calculated as follows:
            <disp-formula id="Ch1.E14" content-type="numbered"><label>14</label><mml:math id="M141" display="block"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>:</mml:mo><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>×</mml:mo><mml:msub><mml:mi>g</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
          where <inline-formula><mml:math id="M142" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>:</mml:mo><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the root mean square of the spectral residuals of the new observation when a total of <inline-formula><mml:math id="M143" display="inline"><mml:mi>j</mml:mi></mml:math></inline-formula> PLS components are used (i.e., all the components from the first one to the <inline-formula><mml:math id="M144" display="inline"><mml:mi>j</mml:mi></mml:math></inline-formula>th one), and <inline-formula><mml:math id="M145" display="inline"><mml:mrow><mml:msub><mml:mi>g</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the root mean square of the regression coefficients corresponding to the <inline-formula><mml:math id="M146" display="inline"><mml:mi>j</mml:mi></mml:math></inline-formula>th PLS component (see <xref ref-type="bibr" rid="bib1.bibx66" id="altparen.64"/>, for more details).</p>
      <p id="d1e3341">The number of neighbors that needed to be retrieved was optimized using nearest neighbor (NN) cross-validation <xref ref-type="bibr" rid="bib1.bibx58" id="paren.65"/>. Using this method, for each observation to be predicted, its nearest neighbor was excluded from the group of neighbors, and then a WA-PLS model is fitted using the remaining ones. This model is then used to predict the value of the response variable of the nearest observation. Predicted values are finally cross-validated with the actual values (see <xref ref-type="bibr" rid="bib1.bibx58" id="altparen.66"/>, for additional details). For the optimization of the nearest neighbor search, i.e., the nearest neighbor cross-validation, a grouping factor was used to avoid overfitting: keeping the nearest neighbor out, the model was trained with the remaining neighbors which were not from the same region as the hold-out neighbor (region corresponds to the sentinel sites within the AfSIS SSL). The minimum number of available<?pagebreak page701?> neighbors was tested for each region prior to training the respective final models, which were then trained with neighborhood sizes varying from 150 to 500 neighbors in increments of 10. The best model and the optimal number of neighbors were determined by the minimal RMSE (Eq. <xref ref-type="disp-formula" rid="Ch1.E15"/>) of the nearest neighbor cross-validation, where <inline-formula><mml:math id="M147" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> is the number of neighbors used for the model, <inline-formula><mml:math id="M148" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mi mathvariant="bold-italic">i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the measured value of the hold-out neighbor, and <inline-formula><mml:math id="M149" display="inline"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mo mathvariant="normal" stretchy="true">^</mml:mo></mml:mover><mml:mi mathvariant="bold-italic">i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the value predicted by the remaining neighbors.</p>
      <p id="d1e3386">Subsequently, independent from their distances to the validation set, 1 to 20 spiking samples were added from the target region and forced into the neighborhood of every observation and thus used in the predictive models. Our approach differs from previous studies using local modeling methods in combination with spiking, where the samples were not forced into the neighborhoods (e.g. <xref ref-type="bibr" rid="bib1.bibx6 bib1.bibx41" id="altparen.67"/>). Our approach guarantees that the spiking set (which is assumed to carry important information) is fully used.</p>
      <p id="d1e3392">Stepwise spiking was applied to test the effect of spiking in general and to find the smallest number of samples required for satisfying model performances. This was necessary since soil samples from the same geographical region are usually governed by very similar formation processes (spatial autocorrelation; <xref ref-type="bibr" rid="bib1.bibx26" id="altparen.68"/>), and MIR spectra partially reflect the compositional characteristics of these samples. Moreover, it is widely accepted that the most accurate predictions can be achieved by models built with samples originating from the same region because large nonlinear complexity is avoided <xref ref-type="bibr" rid="bib1.bibx78" id="paren.69"><named-content content-type="pre">e.g.,</named-content></xref>.</p>
</sec>
<sec id="Ch1.S2.SS8">
  <label>2.8</label><title>Model validation and prediction accuracy</title>
      <p id="d1e3411">For model validation, the RMSE statistics of the nearest neighbor cross-validation described in the previous section were used. Prediction accuracy of the predicted vs. the measured values was also calculated using RMSE (Eq. <xref ref-type="disp-formula" rid="Ch1.E15"/>), where in this case <inline-formula><mml:math id="M150" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mi mathvariant="bold-italic">i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the actual measured reference value and <inline-formula><mml:math id="M151" display="inline"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mo stretchy="true" mathvariant="normal">^</mml:mo></mml:mover><mml:mi mathvariant="bold-italic">i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> the prediction of the final model.
            <disp-formula id="Ch1.E15" content-type="numbered"><label>15</label><mml:math id="M152" display="block"><mml:mrow><mml:mtext>RMSE</mml:mtext><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mstyle><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mi mathvariant="bold-italic">i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi mathvariant="bold-italic">y</mml:mi><mml:mo mathvariant="normal" stretchy="true">^</mml:mo></mml:mover><mml:mi mathvariant="bold-italic">i</mml:mi></mml:msub><mml:msup><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mrow></mml:math></disp-formula></p>
      <p id="d1e3492">Model validation and prediction performance were additionally evaluated using the mean error (ME; mean of the absolute difference between predicted and observed values) and the ratio of performance to the interquartile distance (RPIQ; <xref ref-type="bibr" rid="bib1.bibx15" id="altparen.70"/>). For calculating RPIQ, the interquartile range of the observed reference data is divided by the RMSE of the nearest neighbor validation or by the RMSE of the prediction (RMSE<inline-formula><mml:math id="M153" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>). This is particularly useful since RPIQ does not make any assumptions about the distribution of the reference data.</p>
</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Results</title>
      <p id="d1e3516">The samples that comprise the CSSL exhibited a wide range of TC and TN contents (Fig. <xref ref-type="fig" rid="Ch1.F2"/>). Validation and spiking sets for four of the six regions (Haut-Katanga, Tshopo, Tshuapa, Kabarole) had mean TC and TN of 9.30–18.10 and 0.95–1.74 <inline-formula><mml:math id="M154" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, respectively. Maximum TC and TN values for these four regions were 56.69 and 5.05 <inline-formula><mml:math id="M155" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, respectively. The other two regions, South Kivu in the eastern DRC and Iburengerazuba in western Rwanda, had considerably higher TC and TN contents, with mean values of 23.55–35.43 and 1.34–3.07 <inline-formula><mml:math id="M156" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, respectively. The AfSIS SSL had generally lower mean TC and TN contents of 12.37 and 0.82 <inline-formula><mml:math id="M157" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, respectively.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F2" specific-use="star"><?xmltex \currentcnt{2}?><?xmltex \def\figurename{Figure}?><label>Figure 2</label><caption><p id="d1e3591">Summary of the reference data for total carbon (TC) and total nitrogen (TN) of the two soil spectral libraries (SSLs): the central African SSL (CSSL) and the continental SSL (AfSIS SSL). The CSSL is divided into the six regions (Haut-Katanga, South Kivu, Tshopo, Tshuapa, Iburengerazuba, Kabarole). The black lines and text indicate regional validation sets, while the gray lines and text indicate the spiking sets.</p></caption>
        <?xmltex \igopts{width=497.923228pt}?><graphic xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021-f02.png"/>

      </fig>

<?xmltex \hack{\newpage}?>
<?pagebreak page702?><sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Principal components and spectral variability in the two libraries</title>
      <p id="d1e3610">The first three principal components accounted for 85 <inline-formula><mml:math id="M158" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">%</mml:mi></mml:mrow></mml:math></inline-formula> of the spectral variability (Fig. <xref ref-type="fig" rid="Ch1.F3"/>). These components indicate that the majority of CSSL samples lie within the spectral domains of the AfSIS SSL as their PCA scores overlap. This overlapping is, however, less evident for the spectra of the South Kivu region and, to a lesser extent, for the samples of the Iburengerazuba and Tshuapa regions, which suggests that the type of soils in these regions may not be well represented by the AfSIS SSL compared to the other regions.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F3" specific-use="star"><?xmltex \currentcnt{3}?><?xmltex \def\figurename{Figure}?><label>Figure 3</label><caption><p id="d1e3625">Score plots of the first three principal components of the preprocessed MIR spectra from the central African soil spectral library (six regions; colored) and the large-scale continental library (AfSIS SSL; gray).</p></caption>
          <?xmltex \igopts{width=497.923228pt}?><graphic xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021-f03.png"/>

        </fig>

</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Predictive performance of the three strategies</title>
      <p id="d1e3642">In general, MBL retrieved accurate TC and TN predictions for all the strategies (with RMSE<inline-formula><mml:math id="M159" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values below 9 <inline-formula><mml:math id="M160" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for TC and below 1.7 <inline-formula><mml:math id="M161" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for TN). South Kivu and Iburengerazuba regions showed the highest RMSE<inline-formula><mml:math id="M162" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>, which was mainly due to the high TC and TN ranges (Fig. <xref ref-type="fig" rid="Ch1.F2"/>). Prediction errors for Haut-Katanga, Tshopo, and Tshuapa were comparably smaller; however, the RPIQ<inline-formula><mml:math id="M163" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values were among the smallest across regions as well (RPIQ<inline-formula><mml:math id="M164" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> 0.59–2.72). Relative to their TC and TN ranges, predictions for these three regions were less accurate than for South Kivu and Iburengerazuba (PRIQ<inline-formula><mml:math id="M165" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> 1.10–4.45). The TC and TN predictions in Kabarole were the most accurate compared with the other five regions (RPIQ<inline-formula><mml:math id="M166" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> 2.65–5.48 for TC and TN and all strategies; Table <xref ref-type="table" rid="Ch1.T3"/>).</p>

<?xmltex \floatpos{t}?><table-wrap id="Ch1.T3" specific-use="star"><?xmltex \currentcnt{3}?><label>Table 3</label><caption><p id="d1e3741"> Statistics of the independent validations of the predictions of total carbon and total nitrogen for each region and three strategies. Strategy 1: predictions of the combined six regions by the AfSIS soil spectral library (SSL); strategy 2: predictions of the individual regions by the remaining five regions together with the AfSIS SSL; strategy 3: spiking six regional models from strategy 2 with 20 samples from each target area.</p></caption><oasis:table frame="topbot"><?xmltex \begin{scaleboxenv}{.95}[.95]?><oasis:tgroup cols="12">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right" colsep="1"/>
     <oasis:colspec colnum="8" colname="col8" align="right"/>
     <oasis:colspec colnum="9" colname="col9" align="right"/>
     <oasis:colspec colnum="10" colname="col10" align="right"/>
     <oasis:colspec colnum="11" colname="col11" align="right"/>
     <oasis:colspec colnum="12" colname="col12" align="right"/>
     <oasis:thead>
       <oasis:row>

         <oasis:entry colname="col1">Strategy</oasis:entry>

         <oasis:entry colname="col2">Region</oasis:entry>

         <oasis:entry rowsep="1" namest="col3" nameend="col7" align="center" colsep="1">Total carbon (<inline-formula><mml:math id="M167" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>) </oasis:entry>

         <oasis:entry rowsep="1" namest="col8" nameend="col12" align="center">Total nitrogen (<inline-formula><mml:math id="M168" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>) </oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1"/>

         <oasis:entry colname="col2"/>

         <oasis:entry colname="col3"><inline-formula><mml:math id="M169" display="inline"><mml:mrow><mml:msub><mml:mi>n</mml:mi><mml:mtext>pred</mml:mtext></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col4">RMSE<inline-formula><mml:math id="M170" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col5"><inline-formula><mml:math id="M171" display="inline"><mml:mrow><mml:msubsup><mml:mi>R</mml:mi><mml:mtext>pred</mml:mtext><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col6">ME<inline-formula><mml:math id="M172" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col7">RPIQ<inline-formula><mml:math id="M173" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col8"><inline-formula><mml:math id="M174" display="inline"><mml:mrow><mml:msub><mml:mi>n</mml:mi><mml:mtext>pred</mml:mtext></mml:msub></mml:mrow></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col9">RMSE<inline-formula><mml:math id="M175" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col10"><inline-formula><mml:math id="M176" display="inline"><mml:mrow><mml:msubsup><mml:mi>R</mml:mi><mml:mtext>pred</mml:mtext><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col11">ME<inline-formula><mml:math id="M177" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col12">RPIQ<inline-formula><mml:math id="M178" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula></oasis:entry>

       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>

         <oasis:entry rowsep="1" colname="col1" morerows="5">Strategy 1</oasis:entry>

         <oasis:entry colname="col2">Haut-Katanga</oasis:entry>

         <oasis:entry colname="col3">99</oasis:entry>

         <oasis:entry colname="col4">5.99</oasis:entry>

         <oasis:entry colname="col5">0.79</oasis:entry>

         <oasis:entry colname="col6">4.99</oasis:entry>

         <oasis:entry colname="col7">1.62</oasis:entry>

         <oasis:entry colname="col8">99</oasis:entry>

         <oasis:entry colname="col9">0.81</oasis:entry>

         <oasis:entry colname="col10">0.31</oasis:entry>

         <oasis:entry colname="col11">0.70</oasis:entry>

         <oasis:entry colname="col12">0.59</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">South Kivu</oasis:entry>

         <oasis:entry colname="col3">347</oasis:entry>

         <oasis:entry colname="col4">8.61</oasis:entry>

         <oasis:entry colname="col5">0.94</oasis:entry>

         <oasis:entry colname="col6">3.50</oasis:entry>

         <oasis:entry colname="col7">2.43</oasis:entry>

         <oasis:entry colname="col8">348</oasis:entry>

         <oasis:entry colname="col9">1.66</oasis:entry>

         <oasis:entry colname="col10">0.85</oasis:entry>

         <oasis:entry colname="col11">1.32</oasis:entry>

         <oasis:entry colname="col12">1.10</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshopo</oasis:entry>

         <oasis:entry colname="col3">114</oasis:entry>

         <oasis:entry colname="col4">7.34</oasis:entry>

         <oasis:entry colname="col5">0.47</oasis:entry>

         <oasis:entry colname="col6">2.61</oasis:entry>

         <oasis:entry colname="col7">0.96</oasis:entry>

         <oasis:entry colname="col8">129</oasis:entry>

         <oasis:entry colname="col9">0.55</oasis:entry>

         <oasis:entry colname="col10">0.52</oasis:entry>

         <oasis:entry colname="col11">0.34</oasis:entry>

         <oasis:entry colname="col12">0.93</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshuapa</oasis:entry>

         <oasis:entry colname="col3">718</oasis:entry>

         <oasis:entry colname="col4">3.85</oasis:entry>

         <oasis:entry colname="col5">0.71</oasis:entry>

         <oasis:entry colname="col6">2.06</oasis:entry>

         <oasis:entry colname="col7">1.84</oasis:entry>

         <oasis:entry colname="col8">718</oasis:entry>

         <oasis:entry colname="col9">0.40</oasis:entry>

         <oasis:entry colname="col10">0.68</oasis:entry>

         <oasis:entry colname="col11">0.29</oasis:entry>

         <oasis:entry colname="col12">1.37</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Iburengerazuba</oasis:entry>

         <oasis:entry colname="col3">84</oasis:entry>

         <oasis:entry colname="col4">8.73</oasis:entry>

         <oasis:entry colname="col5">0.84</oasis:entry>

         <oasis:entry colname="col6">4.46</oasis:entry>

         <oasis:entry colname="col7">2.60</oasis:entry>

         <oasis:entry colname="col8">84</oasis:entry>

         <oasis:entry colname="col9">0.82</oasis:entry>

         <oasis:entry colname="col10">0.81</oasis:entry>

         <oasis:entry colname="col11">0.60</oasis:entry>

         <oasis:entry colname="col12">2.13</oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col2">Kabarole</oasis:entry>

         <oasis:entry colname="col3">80</oasis:entry>

         <oasis:entry colname="col4">5.73</oasis:entry>

         <oasis:entry colname="col5">0.86</oasis:entry>

         <oasis:entry colname="col6">1.10</oasis:entry>

         <oasis:entry colname="col7">3.95</oasis:entry>

         <oasis:entry colname="col8">80</oasis:entry>

         <oasis:entry colname="col9">0.65</oasis:entry>

         <oasis:entry colname="col10">0.84</oasis:entry>

         <oasis:entry colname="col11">0.47</oasis:entry>

         <oasis:entry colname="col12">2.86</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry rowsep="1" colname="col1" morerows="5">Strategy 2</oasis:entry>

         <oasis:entry colname="col2">Haut-Katanga</oasis:entry>

         <oasis:entry colname="col3">99</oasis:entry>

         <oasis:entry colname="col4">4.22</oasis:entry>

         <oasis:entry colname="col5">0.72</oasis:entry>

         <oasis:entry colname="col6">1.84</oasis:entry>

         <oasis:entry colname="col7">2.30</oasis:entry>

         <oasis:entry colname="col8">99</oasis:entry>

         <oasis:entry colname="col9">0.32</oasis:entry>

         <oasis:entry colname="col10">0.59</oasis:entry>

         <oasis:entry colname="col11">0.02</oasis:entry>

         <oasis:entry colname="col12">1.50</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">South Kivu</oasis:entry>

         <oasis:entry colname="col3">347</oasis:entry>

         <oasis:entry colname="col4">8.88</oasis:entry>

         <oasis:entry colname="col5">0.95</oasis:entry>

         <oasis:entry colname="col6">4.72</oasis:entry>

         <oasis:entry colname="col7">2.36</oasis:entry>

         <oasis:entry colname="col8">348</oasis:entry>

         <oasis:entry colname="col9">1.17</oasis:entry>

         <oasis:entry colname="col10">0.89</oasis:entry>

         <oasis:entry colname="col11">0.72</oasis:entry>

         <oasis:entry colname="col12">1.55</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshopo</oasis:entry>

         <oasis:entry colname="col3">114</oasis:entry>

         <oasis:entry colname="col4">5.38</oasis:entry>

         <oasis:entry colname="col5">0.64</oasis:entry>

         <oasis:entry colname="col6">0.30</oasis:entry>

         <oasis:entry colname="col7">1.31</oasis:entry>

         <oasis:entry colname="col8">129</oasis:entry>

         <oasis:entry colname="col9">0.34</oasis:entry>

         <oasis:entry colname="col10">0.72</oasis:entry>

         <oasis:entry colname="col11">0.07</oasis:entry>

         <oasis:entry colname="col12">1.49</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshuapa</oasis:entry>

         <oasis:entry colname="col3">718</oasis:entry>

         <oasis:entry colname="col4">4.12</oasis:entry>

         <oasis:entry colname="col5">0.78</oasis:entry>

         <oasis:entry colname="col6">2.21</oasis:entry>

         <oasis:entry colname="col7">1.71</oasis:entry>

         <oasis:entry colname="col8">718</oasis:entry>

         <oasis:entry colname="col9">0.29</oasis:entry>

         <oasis:entry colname="col10">0.77</oasis:entry>

         <oasis:entry colname="col11">0.12</oasis:entry>

         <oasis:entry colname="col12">1.88</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Iburengerazuba</oasis:entry>

         <oasis:entry colname="col3">84</oasis:entry>

         <oasis:entry colname="col4">7.96</oasis:entry>

         <oasis:entry colname="col5">0.86</oasis:entry>

         <oasis:entry colname="col6">2.69</oasis:entry>

         <oasis:entry colname="col7">2.84</oasis:entry>

         <oasis:entry colname="col8">84</oasis:entry>

         <oasis:entry colname="col9">0.54</oasis:entry>

         <oasis:entry colname="col10">0.82</oasis:entry>

         <oasis:entry colname="col11">0.02</oasis:entry>

         <oasis:entry colname="col12">3.21</oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col2">Kabarole</oasis:entry>

         <oasis:entry colname="col3">80</oasis:entry>

         <oasis:entry colname="col4">8.56</oasis:entry>

         <oasis:entry colname="col5">0.83</oasis:entry>

         <oasis:entry colname="col6">4.29</oasis:entry>

         <oasis:entry colname="col7">2.65</oasis:entry>

         <oasis:entry colname="col8">80</oasis:entry>

         <oasis:entry colname="col9">0.64</oasis:entry>

         <oasis:entry colname="col10">0.86</oasis:entry>

         <oasis:entry colname="col11">0.40</oasis:entry>

         <oasis:entry colname="col12">2.90</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col1" morerows="5">Strategy 3</oasis:entry>

         <oasis:entry colname="col2">Haut-Katanga</oasis:entry>

         <oasis:entry colname="col3">99</oasis:entry>

         <oasis:entry colname="col4">3.57</oasis:entry>

         <oasis:entry colname="col5">0.80</oasis:entry>

         <oasis:entry colname="col6">1.35</oasis:entry>

         <oasis:entry colname="col7">2.72</oasis:entry>

         <oasis:entry colname="col8">99</oasis:entry>

         <oasis:entry colname="col9">0.26</oasis:entry>

         <oasis:entry colname="col10">0.71</oasis:entry>

         <oasis:entry colname="col11">0.06</oasis:entry>

         <oasis:entry colname="col12">1.87</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">South Kivu</oasis:entry>

         <oasis:entry colname="col3">347</oasis:entry>

         <oasis:entry colname="col4">7.32</oasis:entry>

         <oasis:entry colname="col5">0.95</oasis:entry>

         <oasis:entry colname="col6">1.53</oasis:entry>

         <oasis:entry colname="col7">2.86</oasis:entry>

         <oasis:entry colname="col8">348</oasis:entry>

         <oasis:entry colname="col9">0.89</oasis:entry>

         <oasis:entry colname="col10">0.89</oasis:entry>

         <oasis:entry colname="col11">0.32</oasis:entry>

         <oasis:entry colname="col12">2.05</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshopo</oasis:entry>

         <oasis:entry colname="col3">114</oasis:entry>

         <oasis:entry colname="col4">4.93</oasis:entry>

         <oasis:entry colname="col5">0.69</oasis:entry>

         <oasis:entry colname="col6">0.11</oasis:entry>

         <oasis:entry colname="col7">1.43</oasis:entry>

         <oasis:entry colname="col8">129</oasis:entry>

         <oasis:entry colname="col9">0.31</oasis:entry>

         <oasis:entry colname="col10">0.75</oasis:entry>

         <oasis:entry colname="col11">0.03</oasis:entry>

         <oasis:entry colname="col12">1.62</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshuapa</oasis:entry>

         <oasis:entry colname="col3">718</oasis:entry>

         <oasis:entry colname="col4">3.19</oasis:entry>

         <oasis:entry colname="col5">0.80</oasis:entry>

         <oasis:entry colname="col6">0.90</oasis:entry>

         <oasis:entry colname="col7">2.22</oasis:entry>

         <oasis:entry colname="col8">718</oasis:entry>

         <oasis:entry colname="col9">0.24</oasis:entry>

         <oasis:entry colname="col10">0.79</oasis:entry>

         <oasis:entry colname="col11">0.03</oasis:entry>

         <oasis:entry colname="col12">2.25</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Iburengerazuba</oasis:entry>

         <oasis:entry colname="col3">84</oasis:entry>

         <oasis:entry colname="col4">6.34</oasis:entry>

         <oasis:entry colname="col5">0.91</oasis:entry>

         <oasis:entry colname="col6">1.14</oasis:entry>

         <oasis:entry colname="col7">3.57</oasis:entry>

         <oasis:entry colname="col8">84</oasis:entry>

         <oasis:entry colname="col9">0.39</oasis:entry>

         <oasis:entry colname="col10">0.91</oasis:entry>

         <oasis:entry colname="col11">0.03</oasis:entry>

         <oasis:entry colname="col12">4.45</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Kabarole</oasis:entry>

         <oasis:entry colname="col3">80</oasis:entry>

         <oasis:entry colname="col4">4.13</oasis:entry>

         <oasis:entry colname="col5">0.94</oasis:entry>

         <oasis:entry colname="col6">1.72</oasis:entry>

         <oasis:entry colname="col7">5.48</oasis:entry>

         <oasis:entry colname="col8">80</oasis:entry>

         <oasis:entry colname="col9">0.44</oasis:entry>

         <oasis:entry colname="col10">0.91</oasis:entry>

         <oasis:entry colname="col11">0.23</oasis:entry>

         <oasis:entry colname="col12">4.27</oasis:entry>

       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup><?xmltex \end{scaleboxenv}?></oasis:table></table-wrap>

      <?xmltex \floatpos{p}?><fig id="Ch1.F4" specific-use="star"><?xmltex \currentcnt{4}?><?xmltex \def\figurename{Figure}?><label>Figure 4</label><caption><p id="d1e4640">Predicted vs. measured total carbon (TC) and total nitrogen (TN) for soil samples of the six central African regions. Predictions for each region were made using memory-based learning and (i) the large-scale continental soil spectral library (AfSIS SSL; strategy 1); (ii) the remaining five central African regions together with the AfSIS SSL (strategy 2); and (iii) 20 local spiking samples from each target region, together with the remaining five central African regions and the AfSIS SSL (strategy 3). A <inline-formula><mml:math id="M179" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>:</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> line is indicated as a visual aid.</p></caption>
          <?xmltex \igopts{width=483.69685pt}?><graphic xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021-f04.png"/>

        </fig>

<?pagebreak page703?><sec id="Ch1.S3.SS2.SSS1">
  <label>3.2.1</label><title>Strategy 1: predicted central African soils by the large-scale continental library</title>
      <?pagebreak page705?><p id="d1e4669">The TC and TN predictions for the six regions of central Africa were characterized by errors (RMSE<inline-formula><mml:math id="M180" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) ranging from 3.85–8.73 and 0.40–1.66 <inline-formula><mml:math id="M181" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>, respectively. The best prediction accuracies for TC were achieved for South Kivu, Iburengerazuba, and Kabarole, where RPIQ<inline-formula><mml:math id="M182" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values were between 2.43–3.95, while Tshopo, Tshuapa, and Haut-Katanga performed worse with RPIQ<inline-formula><mml:math id="M183" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub><mml:mo>&lt;</mml:mo><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.84</mml:mn></mml:mrow></mml:math></inline-formula>. For TN, Iburengerazuba and Kabarole performed well, with RPIQ<inline-formula><mml:math id="M184" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> above 2. However, the four other regions, Haut-Katanga, South Kivu, Tshopo, and Tshuapa, exhibited even lower RPIQ<inline-formula><mml:math id="M185" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub><mml:mo>&lt;</mml:mo><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.37</mml:mn></mml:mrow></mml:math></inline-formula>. For South Kivu, samples with high TC and TN contents (<inline-formula><mml:math id="M186" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">100</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M187" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> TC and <inline-formula><mml:math id="M188" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M189" display="inline"><mml:mrow class="unit"><mml:mspace width="0.125em" linebreak="nobreak"/></mml:mrow></mml:math></inline-formula><inline-formula><mml:math id="M190" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> TN) deviated from the <inline-formula><mml:math id="M191" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>:</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> line (Fig. <xref ref-type="fig" rid="Ch1.F4"/>). Moreover, TC predictions for Haut-Katanga, Tshopo, Tshuapa and Iburengerazuba, as well as TN predictions, in all six regions showed a clear trend towards underestimation  (Fig. <xref ref-type="fig" rid="Ch1.F4"/>). This can be caused by one or a combination of the three following effects: (i) the central African samples were poorly represented by the continental AfSIS SSL due to the differing pedogenic features (Fig. <xref ref-type="fig" rid="Ch1.F3"/>); (ii) the preprocessing methods did not completely account for the spectral offset and/or multiplicative effects in the spectra (due to instrument differences); and (iii) performance differences exist between the conventional laboratory analyses used to obtain TC and TN reference values.</p>
</sec>
<sec id="Ch1.S3.SS2.SSS2">
  <label>3.2.2</label><title>Strategy 2: regional predictions by soil spectral libraries</title>
      <p id="d1e4836">Compared with strategy 1, strategy 2 partially showed better predictive performance for TC and in all the cases retrieved better TN predictions. These improvements are exemplified by the larger RPIQ<inline-formula><mml:math id="M192" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> and smaller RMSE<inline-formula><mml:math id="M193" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values in strategy 2 (Table <xref ref-type="table" rid="Ch1.T3"/>). The most accurate predictions for TC were obtained for the regions Haut-Katanga, South Kivu, Iburengerazuba, and Kabarole (RPIQ<inline-formula><mml:math id="M194" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">2.30</mml:mn></mml:mrow></mml:math></inline-formula>). The predictive performances for TC of Tshopo and Tshuapa were similar, with RPIQ<inline-formula><mml:math id="M195" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values of 1.31 and 1.71, respectively. For TN, the predictive performance was best for Iburengerazuba and Kabarole (RPIQ<inline-formula><mml:math id="M196" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula>). For the regions Haut-Katanga, South Kivu, Tshopo, and Tshuapa, the RPIQ<inline-formula><mml:math id="M197" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values for TN were between 1.49–1.88. The predictions in strategy 2 exhibited errors (RMSE<inline-formula><mml:math id="M198" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) ranging between 4.12–8.88 and 0.29–1.17 <inline-formula><mml:math id="M199" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> for TC and TN, respectively (Table <xref ref-type="table" rid="Ch1.T3"/>). Comparing the TC RMSE<inline-formula><mml:math id="M200" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> of each region across the first two strategies, errors for Haut Katanga, Tshopo, and Iburengerazuba were substantially reduced in strategy 2. Two regions performed equally well (South Kivu and Tshuapa) in both strategies, and only one region (Kabarole) saw an increase in errors (Table <xref ref-type="table" rid="Ch1.T3"/>). For all regions, TN prediction errors (RMSE<inline-formula><mml:math id="M201" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) were consistently lower in strategy 2 than strategy 1 (Table <xref ref-type="table" rid="Ch1.T3"/>). The <inline-formula><mml:math id="M202" display="inline"><mml:mrow><mml:msubsup><mml:mi>R</mml:mi><mml:mtext>pred</mml:mtext><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> values of the TC and TN predictions indicate that the precision of such models was, in general, equal or slightly better for strategy 2 than for strategy 1.</p>
</sec>
<sec id="Ch1.S3.SS2.SSS3">
  <label>3.2.3</label><title>Strategy 3: spiking of the regional models</title>
      <p id="d1e4978">For all regions, spiking the regional models with up to 20 local samples from each corresponding regional spiking set <inline-formula><mml:math id="M203" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="normal">K</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> consistently produced lower prediction errors (Fig. <xref ref-type="fig" rid="Ch1.F5"/>) compared to strategy 1 and strategy 2. For Haut-Katanga, Tshopo, Tshuapa, and Iburengerazuba, the RMSE<inline-formula><mml:math id="M204" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> for TC and TN could be reduced with 10 to 13 spiking samples and did not change substantially thereafter (Fig. <xref ref-type="fig" rid="Ch1.F5"/>). In contrast, for South Kivu and Kabarole, RMSE<inline-formula><mml:math id="M205" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values were minimized, with 16 or more spiking samples from each target region (Fig. <xref ref-type="fig" rid="Ch1.F5"/>). To present the strong and contrasting effect of foregoing any spatial extrapolation in strategy 3, the results for 20 spiking samples are presented in Table <xref ref-type="table" rid="Ch1.T3"/> and Fig. <xref ref-type="fig" rid="Ch1.F4"/>. The strongest reduction of the RMSE<inline-formula><mml:math id="M206" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> for TC in strategy 3 (with 20 spiking samples) compared to strategy 2 (no spiking) was achieved for Kabarole (4.44 <inline-formula><mml:math id="M207" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>), Iburengerazuba (1.62 <inline-formula><mml:math id="M208" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>), and South Kivu (1.56 <inline-formula><mml:math id="M209" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>), followed by Tshuapa, Haut-Katanga, and Tshopo, which decreased by 0.45–0.93 <inline-formula><mml:math id="M210" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>. Similarly, shifting from strategy 2 to 3 had the strongest effect on the RMSE<inline-formula><mml:math id="M211" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> for TN for South Kivu (0.2 <inline-formula><mml:math id="M212" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>), for Kabarole (0.2 <inline-formula><mml:math id="M213" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>), and for Iburengerazuba (0.15 <inline-formula><mml:math id="M214" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>), whereas differences were smaller for Haut-Katanga, Tshuapa, and Tshopo (0.03–0.06 <inline-formula><mml:math id="M215" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>). Strategy 3 also resulted in predictions that better represented the measured values (consistently higher <inline-formula><mml:math id="M216" display="inline"><mml:mrow><mml:msubsup><mml:mi>R</mml:mi><mml:mtext>pred</mml:mtext><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> and RPIQ<inline-formula><mml:math id="M217" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values than in strategy 1 or 2; Table <xref ref-type="table" rid="Ch1.T3"/>). The Kabarole region showed the best predictive performance for TC in strategy 3 (RPIQ<inline-formula><mml:math id="M218" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> of 5.48), followed by Iburengerazuba, South Kivu, Haut-Katanga, and Tshuapa (RPIQ<inline-formula><mml:math id="M219" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> 2.22–3.57). For TN, Iburengerazuba, Kabarole, South Kivu, Tshuapa, and Haut-Katanga showed accurate predictions (RPIQ<inline-formula><mml:math id="M220" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> of 1.87–4.45). RPIQ<inline-formula><mml:math id="M221" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values for the predictions of TC and TN for Tshopo were less than 2 (RPIQ<inline-formula><mml:math id="M222" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> TC: 1.43 and RPIQ<inline-formula><mml:math id="M223" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> TN: 1.62). However, the trend from strategy 1 to strategy 3 was a clear reduction in prediction errors and an increase in accuracy.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F5" specific-use="star"><?xmltex \currentcnt{5}?><?xmltex \def\figurename{Figure}?><label>Figure 5</label><caption><p id="d1e5258">Root mean square error of predicted total carbon <bold>(a)</bold> and total nitrogen (<bold>b</bold>; RMSE<inline-formula><mml:math id="M224" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) for the six regions of central Africa built from the pooled continental library (AfSIS SSL) together with the five remaining central African regions and 0 up to 20 spiking samples. No spiking samples represents strategy 2, and 1 up to 20 spiking samples shows strategy 3. The 20 spiking samples were selected from each particular target area and added stepwise to the predictive models in order to find the lowest number of spiking samples that reduces the prediction accuracy to a satisfactory tolerance level.</p></caption>
            <?xmltex \igopts{width=398.338583pt}?><graphic xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021-f05.png"/>

          </fig>

</sec>
</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Discussion</title>
<sec id="Ch1.S4.SS1">
  <label>4.1</label><title>Strategy 1 and strategy 2: using soil spectral libraries outside of their respective geographical domains</title>
      <p id="d1e5299">Our analysis shows that TC and TN in six regions of our CSSL can be reasonably well predicted through the use of existing SSLs comprised of soils from completely different geographical areas and without any local samples using MBL methods (RMSE<inline-formula><mml:math id="M225" display="inline"><mml:mrow><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">9</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M226" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace width="0.125em" linebreak="nobreak"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> TC and <inline-formula><mml:math id="M227" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0.17</mml:mn></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M228" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> TN, Table <xref ref-type="table" rid="Ch1.T3"/>). The resulting prediction errors were comparable to other large-scale MIR prediction studies <xref ref-type="bibr" rid="bib1.bibx21 bib1.bibx1" id="paren.71"><named-content content-type="pre">e.g.,</named-content></xref> and also to other soil infrared studies, which analyzed geographical extrapolation possibilities <xref ref-type="bibr" rid="bib1.bibx54 bib1.bibx17 bib1.bibx28" id="paren.72"><named-content content-type="pre">e.g.,</named-content></xref>. The advantage of using MBL as the method to build prediction models is that it finds similar spectral observations for every new observation to fit suitable models. This approach works efficiently since spectral similarity is in fact reflecting the similarity between observations in terms of soil composition, information which is largely contained in the MIR features of a sample. This means that the predictive success of MBL models largely depends on the quality of the spectra dissimilarity methods used to find spectral neighbors. In other words, MBL can be described as a method driven by compositional similarity search. The improved prediction accuracy (lower RMSE<inline-formula><mml:math id="M229" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> and higher RPIQ<inline-formula><mml:math id="M230" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula>) when reducing extrapolation (strategy 2) can be explained by the addition of more proximal central African soil samples to the library that are more similar to each predicted region. The continental AfSIS SSL is missing data for most of central Africa (Fig. <xref ref-type="fig" rid="Ch1.F1"/>); none of the tropical forest soils with high contents of organic carbon or with<?pagebreak page706?> distinctive mineral–organic composition are covered by this large-scale SSL. Naturally, this variability impacts the generalization ability of any predictive model or modeling strategy. Moreover, variance arising from instrument and reference laboratory differences was avoided through the use of local models. However, it is not clear why Kabarole exhibited higher prediction errors in strategy 2. A possible reason could be random variance (Fig. <xref ref-type="fig" rid="Ch1.F4"/>) or nonlinearity. Two regions (South Kivu and Tshuapa) did not show any substantial changes on RMSE<inline-formula><mml:math id="M231" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> and RPIQ<inline-formula><mml:math id="M232" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values for TC when comparing strategy 1 and strategy 2. Note that both South Kivu and to some extent also Tshuapa cover a distinct score space in Fig. <xref ref-type="fig" rid="Ch1.F3"/> and therefore are not well represented by the remaining central African regions, nor by the AfSIS SSL.</p>
      <p id="d1e5416">All central African regions from the CSSL show large variability in TC and TN contents (Fig. <xref ref-type="fig" rid="Ch1.F2"/>) and contain samples from various land cover (forest/croplands), altitudes (Table <xref ref-type="table" rid="Ch1.T2"/>), and parent materials. These differences suggest that soils have developed and been transformed under a variety of environmental conditions. For example, high diversity in organic compounds and their stabilization in soils (i.e., organo–mineral association, complexation, aggregation) can introduce nonlinear relationships  that are difficult to predict with locally linear calibration methods (i.e., memory-based learning in combination with PLS regression). Thus, we conclude that the particularly high soil diversity in these two regions, in terms of biogeochemical and physical properties, introduces additional complexity into the soil spectral prediction workflow. Similarly high RMSEs have been shown in other studies for samples with organic carbon higher than 150 <inline-formula><mml:math id="M233" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula> <xref ref-type="bibr" rid="bib1.bibx52" id="paren.73"/>. As in our study, these high errors were attributed to high TC contents. To improve prediction accuracies for these diverse regions, more data are needed. The creation of subsets from large spectral libraries via spectral similarities, for example, has been shown to be effective to train calibration models <xref ref-type="bibr" rid="bib1.bibx86 bib1.bibx18 bib1.bibx62" id="paren.74"><named-content content-type="pre">e.g.,</named-content></xref>. Hence, in order to reduce uncertainties for regions in central Africa that are diverse in terms of soil chemical composition, in particular for the Great Lakes region, there is a pressing need to fill the existing gaps in the continental library by gathering more data on the ground.</p>
</sec>
<sec id="Ch1.S4.SS2">
  <label>4.2</label><title>Strategy 3: effect of spiking with local samples on prediction performance</title>
      <p id="d1e5456">The spiking of the calibration models with local target samples had a positive effect for all included regions (Fig. <xref ref-type="fig" rid="Ch1.F5"/> and Table <xref ref-type="table" rid="Ch1.T3"/>). Kabarole, Iburengerazuba, and South Kivu, which showed the most substantial reductions of RMSE<inline-formula><mml:math id="M234" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> for TC and TN by spiking, cover different land uses, high altitudes along the Albertine Rift, and larger climatic ranges (Table <xref ref-type="table" rid="Ch1.T2"/>). These soils are not adequately represented by the continental AfSIS SSL, nor by the remaining central African regions, and therefore exhibited a strong effect when spiked with local soil data. Although the effect of spiking on RMSE<inline-formula><mml:math id="M235" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> for TC and TN was somewhat smaller for the other included regions (Haut-Katanga, Tshopo, and Tshuapa), it still produced noticeable improvements compared to strategy 1 and strategy 2 (smaller RMSE<inline-formula><mml:math id="M236" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> and larger RPIQ<inline-formula><mml:math id="M237" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> values). The TC and TN ranges of Haut-Katanga, Tshopo, and Tshuapa were narrower, and they also seem to be better represented by each other and by the AfSIS SSL (with the exception of a few samples of Tshuapa; Fig. <xref ref-type="fig" rid="Ch1.F3"/>). In these three regions, sufficiently similar spectra were available, and the MBL found the required neighbors to build accurate models and predict<?pagebreak page707?> TC and TN, thus lowering the positive effect of spiking. Additionally, the weaker influence of spiking on soils of Tshopo (RPIQ<inline-formula><mml:math id="M238" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> TC: 1.43 and RPIQ<inline-formula><mml:math id="M239" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> TN: 1.62) can be explained by an outlier in the predictions (Fig. <xref ref-type="fig" rid="Ch1.F4"/>) and a slightly uneven distribution of the reference data between the validation and spiking sets (Fig. <xref ref-type="fig" rid="Ch1.F2"/>). In summary, spiking has already been shown to improve performance <xref ref-type="bibr" rid="bib1.bibx31 bib1.bibx64 bib1.bibx6" id="paren.75"><named-content content-type="pre">e.g.,</named-content></xref> and also proved its value in our study. However, a threshold of 20 samples poses non-negligible additional costs for laboratory reference analysis, and the benefit in terms of gain of accuracy by spiking depends on the region and is not always guaranteed. In some cases, however, a smaller number of spiking samples can substantially reduce the RMSE<inline-formula><mml:math id="M240" display="inline"><mml:msub><mml:mi/><mml:mtext>pred</mml:mtext></mml:msub></mml:math></inline-formula> (e.g. Iburengerazuba and Kabarole). The required prediction accuracy and additional investments depend hereby on the field of application. The achieved predictions and their errors from this study are more than satisfactory for the study of TC and TN dynamics and will improve the availability of high-resolution soil data of central Africa. Thus, spiking is recommended when soils are highly variable and show large distances to existing spectral libraries.</p>
</sec>
<sec id="Ch1.S4.SS3">
  <label>4.3</label><title>Suggestions for building new models and extending the existing spectral library</title>
      <p id="d1e5549">Our regional predictions of TC and TN show promising results when analyzing soils from geographically distinct areas in central Africa that are not covered by the continental AfSIS SSL (Fig. <xref ref-type="fig" rid="Ch1.F1"/>). Six central African regions were predicted for soil TC and TN with sufficient accuracy using the large-scale AfSIS soil spectral library only. The general positive effect of adding geographically closer samples to the AfSIS SSL (strategy 2) underlines the usability of spectral libraries for new regions. The generally positive effect of strategy 3, spiking of all regional predictions for TC and TN with samples from the target area, encourages the future amendment of currently existing libraries to improve prediction accuracy. To improve future soil analyses and to extend the geographical area covered by an SSL, we suggest the following workflow:
<list list-type="order"><list-item>
      <p id="d1e5556"><italic>Preprocessing</italic>. Different spectral preprocessing methods influence model and prediction performance. We suggest selecting the best preprocessing strategies using spectral projections and minimizing the reconstruction error (see Sect. <xref ref-type="sec" rid="Ch1.S2.SS4"/>).</p></list-item><list-item>
      <p id="d1e5564"><italic>Estimation of uncertainty for new samples</italic>. When analyzing new soil samples from a  region which is not covered by the existing SSL, samples with different composition and hence chemical properties are more likely to be introduced. Samples with high distances in the score space to the SSL cannot be predicted accurately with a high certainty, since they are often highly divergent from the SSL. We recommend that a preliminary graphical inspection of resampled and preprocessed spectra can already allow for recognition of differences. A further dimension reduction (e.g. with a PCA) with a subsequent 2D or 3D visualization of the first factors provides additional insights into dissimilarity.</p></list-item><list-item>
      <p id="d1e5570"><italic>Reference analysis for independent validation</italic>. If the new samples are from a completely new region or the new sample set tends to differ from the SSL, a certain number of validation samples is recommended to test for prediction accuracy. The number is dependent on the similarity/dissimilarity to the SSL.</p></list-item><list-item>
      <p id="d1e5576"><italic>Search for nearest neighbors and training of a model</italic>. Run an MBL algorithm to find the nearest neighbors of the new set and train a subsequent weighted average PLS regression.</p></list-item><list-item>
      <p id="d1e5582"><italic>Model validation</italic>. For predicting soil TC and TN and quantifying the error of these predictions in  new geographical regions, a new model validation is required. The nearest neighbor validation is a suitable method, as demonstrated  in this study.</p></list-item><list-item>
      <p id="d1e5588"><italic>Data and libraries made available to the community</italic>. The created CSSL is freely available to use and build upon at our GitHub repository at <uri>https://doi.org/10.5281/zenodo.4351254</uri> (last access: 20 December 2020). As shown with the AfSIS SSL, the application of already existing libraries and the extrapolation to new regions is accurate and suitable to estimate soil properties. However, to make predictions more accurate, especially for more diverse, heterogeneous, and complex soils, more data are required. As demonstrated, the addition of new geographical regions improves the overall prediction accuracy when more proximal central African regions were added to the large-scale library. These results encourage the use and amendment of existing libraries, rather than the construction of new, separate, and extensive databases. Given the existing distribution of samples in the new CSSL, it is especially important to increase the number of forest soils with high TC contents, which represent a large portion of the Congo Basin. The future enlargement of the CSSL, preferably facilitated by our suggested workflow, is crucial to fill the gap of soil information in this highly understudied part of the world and can be assisted by the soil science community by adopting a sharing-oriented open data policy.</p></list-item></list></p><?xmltex \hack{\newpage}?>
</sec>
</sec>
<?pagebreak page708?><sec id="Ch1.S5" sec-type="conclusions">
  <label>5</label><title>Conclusions</title>
      <p id="d1e5607">Our study presents the results and workflow for building the first central African SSL for predicting soil properties (TC and TN) using lab-based MIR spectroscopy in a crucial but understudied area of the African continent. Extrapolations were possible for central Africa and for all the six selected regions. Our results further demonstrate how MBL algorithms are useful to find spectral similarities and reduce the need for spiking when a new set covers the same score space as the existing library. These encouraging insights highlight the utility of spectral libraries for future applications, since they are not necessarily limited to certain geographical areas. Our approach of augmenting a smaller SSL with a continental SSL, even when scanned on different instruments, leads to reasonably accurate predictions for new regions, which allows for analyses of TC and TN dynamics in soils but also meets a competitive cost–benefit trade-off. Furthermore, the CSSL fills an appreciable continental gap of the continental-scale AfSIS SSL and contributes to covering an important range of soil variability with spectral data, particularly from tropical forests. However, in order to improve the accuracy of predicting soil organic matter across regions, especially for soil compartments with high TC and TN contents, our study highlights the need to extend the existing library into new regions. The inclusion of more samples and regions, in particular with more (varying) data of humid tropical forest soils, is crucial to fill existing gaps. Combining spectral libraries will allow for fast analyses of soil samples and provide spatially explicit data across humid tropical Africa.</p><?xmltex \hack{\clearpage}?>
</sec>

      
      </body>
    <back><app-group>

<?pagebreak page709?><app id="App1.Ch1.S1">
  <?xmltex \currentcnt{A}?><label>Appendix A</label><title/>

      <?xmltex \floatpos{h!}?><fig id="App1.Ch1.S1.F6"><?xmltex \currentcnt{A1}?><?xmltex \def\figurename{Figure}?><label>Figure A1</label><caption><p id="d1e5623">Locations and resampled spectra for the sampling regions (six selected central African regions with a <inline-formula><mml:math id="M241" display="inline"><mml:mo>∘</mml:mo></mml:math></inline-formula> symbol and the remaining four regions with a <inline-formula><mml:math id="M242" display="inline"><mml:mi mathvariant="italic">▿</mml:mi></mml:math></inline-formula> symbol). All samples are included in the archive of the spectral library for central Africa. For the Democratic Republic of Congo (DRC) and Rwanda (RWA), the regions correspond to provinces; for Uganda (UGA), the sampling region corresponds to a district. The average spectra of each region are shown (bold line) along with the individual sample spectra (transparent lines). Base map created using Natural Earth.</p></caption>
        <?xmltex \hack{\hsize\textwidth}?>
        <?xmltex \igopts{width=497.923228pt}?><graphic xlink:href="https://soil.copernicus.org/articles/7/693/2021/soil-7-693-2021-f06.png"/>

      </fig>

<?xmltex \hack{\clearpage}?><?xmltex \floatpos{h!}?><table-wrap id="App1.Ch1.S1.T4" orientation="landscape"><?xmltex \hack{\hsize\textwidth}?><?xmltex \currentcnt{A1}?><label>Table A1</label><caption><p id="d1e5653"> Number of samples, GPS coordinates, elevation, annual precipitation (AP), mean annual temperature (MAT), Köppen–Geiger climate classifications, and soil types for entire soil spectral library for the Democratic Republic of Congo, Rwanda and Uganda. Data were extracted for all coordinates from raster files. Climate data are sourced from <xref ref-type="bibr" rid="bib1.bibx25" id="text.76"/>, elevation from SRTM (90 m resolution; <xref ref-type="bibr" rid="bib1.bibx37" id="altparen.77"/>), Köppen–Geiger climate classifications from <xref ref-type="bibr" rid="bib1.bibx14" id="text.78"/>, and soil types from the Soil Atlas of Africa <xref ref-type="bibr" rid="bib1.bibx38 bib1.bibx35" id="paren.79"/>.</p></caption><oasis:table frame="topbot"><?xmltex \begin{scaleboxenv}{.95}[.95]?><oasis:tgroup cols="9">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right"/>
     <oasis:colspec colnum="8" colname="col8" align="left"/>
     <oasis:colspec colnum="9" colname="col9" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Region</oasis:entry>
         <oasis:entry colname="col2"><inline-formula><mml:math id="M243" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula></oasis:entry>
         <oasis:entry colname="col3">Longitude (<inline-formula><mml:math id="M244" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col4">Latitude (<inline-formula><mml:math id="M245" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>)</oasis:entry>
         <oasis:entry colname="col5">Elevation (m)</oasis:entry>
         <oasis:entry colname="col6">MAT (<inline-formula><mml:math id="M246" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C)</oasis:entry>
         <oasis:entry colname="col7">AP (mm)</oasis:entry>
         <oasis:entry colname="col8">Köppen–Geiger</oasis:entry>
         <oasis:entry colname="col9">Soil types</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Haut-Katanga</oasis:entry>
         <oasis:entry colname="col2">119</oasis:entry>
         <oasis:entry colname="col3">27.48–27.85</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M247" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>11.61 to <inline-formula><mml:math id="M248" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>11.29</oasis:entry>
         <oasis:entry colname="col5">1197–1323</oasis:entry>
         <oasis:entry colname="col6">20.6</oasis:entry>
         <oasis:entry colname="col7">1223</oasis:entry>
         <oasis:entry colname="col8">Cwa</oasis:entry>
         <oasis:entry colname="col9">Rhodic/Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">South Kivu</oasis:entry>
         <oasis:entry colname="col2">369</oasis:entry>
         <oasis:entry colname="col3">28.64–28.91</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M249" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.79 to <inline-formula><mml:math id="M250" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.1</oasis:entry>
         <oasis:entry colname="col5">1487–2310</oasis:entry>
         <oasis:entry colname="col6">17.6</oasis:entry>
         <oasis:entry colname="col7">1627</oasis:entry>
         <oasis:entry colname="col8">Cfb, Csb, Aw, Cwb</oasis:entry>
         <oasis:entry colname="col9">Umbric Ferralsols, Haplic Acrisols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tshopo</oasis:entry>
         <oasis:entry colname="col2">315</oasis:entry>
         <oasis:entry colname="col3">24.48–25.32</oasis:entry>
         <oasis:entry colname="col4">0.29–0.83</oasis:entry>
         <oasis:entry colname="col5">380–506</oasis:entry>
         <oasis:entry colname="col6">24.9</oasis:entry>
         <oasis:entry colname="col7">1789</oasis:entry>
         <oasis:entry colname="col8">Af</oasis:entry>
         <oasis:entry colname="col9">Xanthic/Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tshuapa</oasis:entry>
         <oasis:entry colname="col2">738</oasis:entry>
         <oasis:entry colname="col3">21.84–22.53</oasis:entry>
         <oasis:entry colname="col4">0.28–0.8</oasis:entry>
         <oasis:entry colname="col5">385–578</oasis:entry>
         <oasis:entry colname="col6">24.7</oasis:entry>
         <oasis:entry colname="col7">2090</oasis:entry>
         <oasis:entry colname="col8">Af</oasis:entry>
         <oasis:entry colname="col9">Xanthic/Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Iburengerazuba</oasis:entry>
         <oasis:entry colname="col2">107</oasis:entry>
         <oasis:entry colname="col3">29.05–29.22</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M251" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.47 to <inline-formula><mml:math id="M252" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>2.34</oasis:entry>
         <oasis:entry colname="col5">1565–1939</oasis:entry>
         <oasis:entry colname="col6">17.6</oasis:entry>
         <oasis:entry colname="col7">1496</oasis:entry>
         <oasis:entry colname="col8">Csb, Aw, Cwb</oasis:entry>
         <oasis:entry colname="col9">Haplic/Umbric Acrisols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Kabarole</oasis:entry>
         <oasis:entry colname="col2">101</oasis:entry>
         <oasis:entry colname="col3">30.13–30.37</oasis:entry>
         <oasis:entry colname="col4">0.46–0.63</oasis:entry>
         <oasis:entry colname="col5">1271–1824</oasis:entry>
         <oasis:entry colname="col6">19.7</oasis:entry>
         <oasis:entry colname="col7">1360</oasis:entry>
         <oasis:entry colname="col8">Af, Cfb, Am</oasis:entry>
         <oasis:entry colname="col9">Haplic Phaeozems, Rhodic Nitisols, Albic Luvisols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Équateur</oasis:entry>
         <oasis:entry colname="col2">12</oasis:entry>
         <oasis:entry colname="col3">18.31</oasis:entry>
         <oasis:entry colname="col4">0.06</oasis:entry>
         <oasis:entry colname="col5">322</oasis:entry>
         <oasis:entry colname="col6">25.5</oasis:entry>
         <oasis:entry colname="col7">1685</oasis:entry>
         <oasis:entry colname="col8">Af</oasis:entry>
         <oasis:entry colname="col9">Eutric Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Bas-Uélé</oasis:entry>
         <oasis:entry colname="col2">49</oasis:entry>
         <oasis:entry colname="col3">24.75</oasis:entry>
         <oasis:entry colname="col4">2.8</oasis:entry>
         <oasis:entry colname="col5">423</oasis:entry>
         <oasis:entry colname="col6">25.2</oasis:entry>
         <oasis:entry colname="col7">1641</oasis:entry>
         <oasis:entry colname="col8">Aw</oasis:entry>
         <oasis:entry colname="col9">Haplic Ferralsols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">North Kivu</oasis:entry>
         <oasis:entry colname="col2">4</oasis:entry>
         <oasis:entry colname="col3">29.25–29.27</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M253" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>1.55 to <inline-formula><mml:math id="M254" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>1.53</oasis:entry>
         <oasis:entry colname="col5">2276–3250</oasis:entry>
         <oasis:entry colname="col6">12.8</oasis:entry>
         <oasis:entry colname="col7">1834</oasis:entry>
         <oasis:entry colname="col8">Cfb</oasis:entry>
         <oasis:entry colname="col9">Umbric Silandic Andosols</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Kongo Central</oasis:entry>
         <oasis:entry colname="col2">40</oasis:entry>
         <oasis:entry colname="col3">12.89–14.63</oasis:entry>
         <oasis:entry colname="col4"><inline-formula><mml:math id="M255" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>5.88 to <inline-formula><mml:math id="M256" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>4.71</oasis:entry>
         <oasis:entry colname="col5">30–470</oasis:entry>
         <oasis:entry colname="col6">25.5</oasis:entry>
         <oasis:entry colname="col7">1088</oasis:entry>
         <oasis:entry colname="col8">Aw</oasis:entry>
         <oasis:entry colname="col9">Ferralic Cambisols, Haplic Acrisols,</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
         <oasis:entry colname="col6"/>
         <oasis:entry colname="col7"/>
         <oasis:entry colname="col8"/>
         <oasis:entry colname="col9">Umbric Nitisols, Xanthic Ferralsols, Mollic Gleysols</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup><?xmltex \end{scaleboxenv}?></oasis:table></table-wrap>

<?xmltex \hack{\clearpage}?><?xmltex \floatpos{h!}?><table-wrap id="App1.Ch1.S1.T5"><?xmltex \hack{\hsize\textwidth}?><?xmltex \currentcnt{A2}?><label>Table A2</label><caption><p id="d1e6167"> Summary of the reference data for total carbon (TC) and total nitrogen (TN) of the two soil spectral libraries for central Africa (CSSL) and for continental sub-Saharan Africa (AfSIS SSL).</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="12">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right" colsep="1"/>
     <oasis:colspec colnum="8" colname="col8" align="right"/>
     <oasis:colspec colnum="9" colname="col9" align="right"/>
     <oasis:colspec colnum="10" colname="col10" align="right"/>
     <oasis:colspec colnum="11" colname="col11" align="right"/>
     <oasis:colspec colnum="12" colname="col12" align="right"/>
     <oasis:thead>
       <oasis:row>

         <oasis:entry colname="col1">SSL</oasis:entry>

         <oasis:entry colname="col2">Region covered</oasis:entry>

         <oasis:entry rowsep="1" namest="col3" nameend="col7" align="center" colsep="1">TC (<inline-formula><mml:math id="M257" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>) </oasis:entry>

         <oasis:entry rowsep="1" namest="col8" nameend="col12" align="center">TN (<inline-formula><mml:math id="M258" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">g</mml:mi><mml:mspace linebreak="nobreak" width="0.125em"/><mml:msup><mml:mi mathvariant="normal">kg</mml:mi><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>) </oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col1"/>

         <oasis:entry colname="col2"/>

         <oasis:entry colname="col3"><inline-formula><mml:math id="M259" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col4">Mean</oasis:entry>

         <oasis:entry colname="col5">Median</oasis:entry>

         <oasis:entry colname="col6">Min</oasis:entry>

         <oasis:entry colname="col7">Max</oasis:entry>

         <oasis:entry colname="col8"><inline-formula><mml:math id="M260" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula></oasis:entry>

         <oasis:entry colname="col9">Mean</oasis:entry>

         <oasis:entry colname="col10">Median</oasis:entry>

         <oasis:entry colname="col11">Min</oasis:entry>

         <oasis:entry colname="col12">Max</oasis:entry>

       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>

         <oasis:entry rowsep="1" colname="col1" morerows="9">CSSL</oasis:entry>

         <oasis:entry colname="col2">Haut-Katanga</oasis:entry>

         <oasis:entry colname="col3">119</oasis:entry>

         <oasis:entry colname="col4">11.31</oasis:entry>

         <oasis:entry colname="col5">9.66</oasis:entry>

         <oasis:entry colname="col6">1.26</oasis:entry>

         <oasis:entry colname="col7">34.66</oasis:entry>

         <oasis:entry colname="col8">119</oasis:entry>

         <oasis:entry colname="col9">1.10</oasis:entry>

         <oasis:entry colname="col10">1.04</oasis:entry>

         <oasis:entry colname="col11">0.44</oasis:entry>

         <oasis:entry colname="col12">2.92</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">South Kivu</oasis:entry>

         <oasis:entry colname="col3">367</oasis:entry>

         <oasis:entry colname="col4">35.37</oasis:entry>

         <oasis:entry colname="col5">29.28</oasis:entry>

         <oasis:entry colname="col6">5.98</oasis:entry>

         <oasis:entry colname="col7">182.10</oasis:entry>

         <oasis:entry colname="col8">368</oasis:entry>

         <oasis:entry colname="col9">3.06</oasis:entry>

         <oasis:entry colname="col10">2.40</oasis:entry>

         <oasis:entry colname="col11">0.68</oasis:entry>

         <oasis:entry colname="col12">15.02</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshopo</oasis:entry>

         <oasis:entry colname="col3">134</oasis:entry>

         <oasis:entry colname="col4">13.84</oasis:entry>

         <oasis:entry colname="col5">12.37</oasis:entry>

         <oasis:entry colname="col6">4.00</oasis:entry>

         <oasis:entry colname="col7">56.69</oasis:entry>

         <oasis:entry colname="col8">149</oasis:entry>

         <oasis:entry colname="col9">1.02</oasis:entry>

         <oasis:entry colname="col10">0.90</oasis:entry>

         <oasis:entry colname="col11">0.20</oasis:entry>

         <oasis:entry colname="col12">4.46</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Tshuapa</oasis:entry>

         <oasis:entry colname="col3">738</oasis:entry>

         <oasis:entry colname="col4">12.64</oasis:entry>

         <oasis:entry colname="col5">11.64</oasis:entry>

         <oasis:entry colname="col6">3.71</oasis:entry>

         <oasis:entry colname="col7">47.42</oasis:entry>

         <oasis:entry colname="col8">738</oasis:entry>

         <oasis:entry colname="col9">0.95</oasis:entry>

         <oasis:entry colname="col10">0.87</oasis:entry>

         <oasis:entry colname="col11">0.17</oasis:entry>

         <oasis:entry colname="col12">3.94</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Iburengerazuba</oasis:entry>

         <oasis:entry colname="col3">104</oasis:entry>

         <oasis:entry colname="col4">26.31</oasis:entry>

         <oasis:entry colname="col5">22.69</oasis:entry>

         <oasis:entry colname="col6">1.49</oasis:entry>

         <oasis:entry colname="col7">93.85</oasis:entry>

         <oasis:entry colname="col8">104</oasis:entry>

         <oasis:entry colname="col9">1.73</oasis:entry>

         <oasis:entry colname="col10">1.54</oasis:entry>

         <oasis:entry colname="col11">0.11</oasis:entry>

         <oasis:entry colname="col12">5.48</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Kabarole</oasis:entry>

         <oasis:entry colname="col3">100</oasis:entry>

         <oasis:entry colname="col4">17.69</oasis:entry>

         <oasis:entry colname="col5">11.95</oasis:entry>

         <oasis:entry colname="col6">0.77</oasis:entry>

         <oasis:entry colname="col7">53.76</oasis:entry>

         <oasis:entry colname="col8">100</oasis:entry>

         <oasis:entry colname="col9">1.68</oasis:entry>

         <oasis:entry colname="col10">1.21</oasis:entry>

         <oasis:entry colname="col11">0.11</oasis:entry>

         <oasis:entry colname="col12">5.05</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Équateur</oasis:entry>

         <oasis:entry colname="col3">12</oasis:entry>

         <oasis:entry colname="col4">13.17</oasis:entry>

         <oasis:entry colname="col5">10.19</oasis:entry>

         <oasis:entry colname="col6">1.24</oasis:entry>

         <oasis:entry colname="col7">50.53</oasis:entry>

         <oasis:entry colname="col8">12</oasis:entry>

         <oasis:entry colname="col9">0.75</oasis:entry>

         <oasis:entry colname="col10">0.75</oasis:entry>

         <oasis:entry colname="col11">0.23</oasis:entry>

         <oasis:entry colname="col12">1.37</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">Bas-Uélé</oasis:entry>

         <oasis:entry colname="col3">49</oasis:entry>

         <oasis:entry colname="col4">10.93</oasis:entry>

         <oasis:entry colname="col5">9.64</oasis:entry>

         <oasis:entry colname="col6">2.73</oasis:entry>

         <oasis:entry colname="col7">28.37</oasis:entry>

         <oasis:entry colname="col8">49</oasis:entry>

         <oasis:entry colname="col9">0.87</oasis:entry>

         <oasis:entry colname="col10">0.73</oasis:entry>

         <oasis:entry colname="col11">0.24</oasis:entry>

         <oasis:entry colname="col12">2.25</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col2">North Kivu</oasis:entry>

         <oasis:entry colname="col3">4</oasis:entry>

         <oasis:entry colname="col4">310.16</oasis:entry>

         <oasis:entry colname="col5">319.67</oasis:entry>

         <oasis:entry colname="col6">189.65</oasis:entry>

         <oasis:entry colname="col7">411.65</oasis:entry>

         <oasis:entry colname="col8">4</oasis:entry>

         <oasis:entry colname="col9">19.32</oasis:entry>

         <oasis:entry colname="col10">18.04</oasis:entry>

         <oasis:entry colname="col11">11.96</oasis:entry>

         <oasis:entry colname="col12">29.24</oasis:entry>

       </oasis:row>
       <oasis:row rowsep="1">

         <oasis:entry colname="col2">Kongo Central</oasis:entry>

         <oasis:entry colname="col3">40</oasis:entry>

         <oasis:entry colname="col4">16.78</oasis:entry>

         <oasis:entry colname="col5">12.41</oasis:entry>

         <oasis:entry colname="col6">3.36</oasis:entry>

         <oasis:entry colname="col7">54.96</oasis:entry>

         <oasis:entry colname="col8">40</oasis:entry>

         <oasis:entry colname="col9">1.38</oasis:entry>

         <oasis:entry colname="col10">1.18</oasis:entry>

         <oasis:entry colname="col11">0.44</oasis:entry>

         <oasis:entry colname="col12">4.88</oasis:entry>

       </oasis:row>
       <oasis:row>

         <oasis:entry colname="col1">AfSIS SSL</oasis:entry>

         <oasis:entry colname="col2">Sub-Saharan Africa</oasis:entry>

         <oasis:entry colname="col3">1902</oasis:entry>

         <oasis:entry colname="col4">12.37</oasis:entry>

         <oasis:entry colname="col5">7.82</oasis:entry>

         <oasis:entry colname="col6">0.84</oasis:entry>

         <oasis:entry colname="col7">112.88</oasis:entry>

         <oasis:entry colname="col8">1902</oasis:entry>

         <oasis:entry colname="col9">0.82</oasis:entry>

         <oasis:entry colname="col10">0.53</oasis:entry>

         <oasis:entry colname="col11">0.04</oasis:entry>

         <oasis:entry colname="col12">6.59</oasis:entry>

       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

<?xmltex \hack{\clearpage}?>
</app>
  </app-group><notes notes-type="codedataavailability"><title>Code and data availability</title>

      <p id="d1e6727">Data and R codes are available on the GitHub repository laura-summerauer/ssl-central-africa (<ext-link xlink:href="https://doi.org/10.5281/zenodo.4351254" ext-link-type="DOI">10.5281/zenodo.4351254</ext-link>,  <xref ref-type="bibr" rid="bib1.bibx75" id="altparen.80"/>).</p>
  </notes><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d1e6739">JS conceived the study. LS, PB, and LRL were the main contributors to the conceptualization, methodology (modeling strategies), and data analyses. MBar supported the conceptualization and provided technical support and project coordination. PB, LRL, SD, MBar, MBau, and JS helped with the writing of the paper. LS, MBau, BB, MR, PB, EK, KVO, BV, DC, ABH, PM, AS, KS, BBM, EVR, GB, and SD substantially contributed to the work by organizing, preparing, and providing soil samples and the corresponding reference data. All co-authors revised the paper.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d1e6745">The authors declare that they have no conflict of interest.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d1e6751">Publisher’s note: Copernicus Publications remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.</p>
  </notes><notes notes-type="sistatement"><title>Special issue statement</title>

      <p id="d1e6757">This article is part of the special issue “Tropical biogeochemistry of soils in the Congo Basin and the African Great Lakes region”. It is not associated with a conference.</p>
  </notes><ack><title>Acknowledgements</title><p id="d1e6763">We are truly grateful to all collaborators in the Democratic Republic of Congo, in Rwanda, and in Uganda, who made this study possible and helped us with the organization and coordination of numerous field campaigns. We would like to express our gratitude to all the farmers and their families for their hospitality and help during the soil sampling. We would like to warmly thank the teams of the International Institute of Tropical Agriculture (IITA) in Bukavu (Kalambo), in Kinshasa, and in Nairobi, the World Agroforestry Centre (ICRAF) in Nairobi, the University of Lubumbashi, the Catholic University of Bukavu, the Mountains of the Moon University, Fort Portal, and the African Wildlife Foundation (AWF) in Kinshasa for their support and generosity. Moreover, we acknowledge the German Research Foundation (DFG, Deutsche Forschungsgemeinschaft) for their funding for the TropSOC project. Additionally, we would like to acknowledge the Walter Hochstrasser Foundation for their generous financial support of a unique master's thesis for 6 months in Djolu, the province of Tshuapa. Thanks are also expressed to Heather Maclean and Travis Drake, for the additional editing of the manuscript. Finally, we would like to thank the handling editors of <italic>SOIL</italic> and two anonymous reviewers for their valuable comments and insights that helped us to improve the manuscript and guided us during the review process.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d1e6771">This study was funded by core ETH funding provided to the Sustainable Agroecosystems Group and the Soil Resources Group from ETH Zurich.</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d1e6777">This paper was edited by Stefan Hauser and reviewed by two anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bibx1"><?xmltex \def\ref@label{{Angelopoulou et~al.(2020)Angelopoulou, Balafoutis, Zalidis, and
Bochtis}}?><label>Angelopoulou et al.(2020)Angelopoulou, Balafoutis, Zalidis, and
Bochtis</label><?label angelopoulouLaboratoryProximalSensing2020?><mixed-citation>Angelopoulou, T., Balafoutis, A., Zalidis, G., and Bochtis, D.: From
Laboratory to Proximal Sensing Spectroscopy for Soil Organic Carbon
Estimation – A Review, Sustainability, 12, 1–24,
<ext-link xlink:href="https://doi.org/10.3390/su12020443" ext-link-type="DOI">10.3390/su12020443</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx2"><?xmltex \def\ref@label{{Baert(1995)}}?><label>Baert(1995)</label><?label baertPropertiesChemicalManagement1995?><mixed-citation>
Baert, G.: Properties and Chemical Management Aspects of Soils on Different
Parent Rocks in the Lower Zaire, Doctoral thesis, Ghent University,
Ghent, Belgium, 1995.</mixed-citation></ref>
      <ref id="bib1.bibx3"><?xmltex \def\ref@label{{Baert et~al.(2009)Baert, Van~Ranst, Ngongo, Kasongo, Verdoodt,
Mujinya, and Mukalay}}?><label>Baert et al.(2009)Baert, Van Ranst, Ngongo, Kasongo, Verdoodt,
Mujinya, and Mukalay</label><?label baertGuideSolsCongo2009?><mixed-citation>
Baert, G., Van Ranst, E., Ngongo, M., Kasongo, E., Verdoodt, A., Mujinya, B.,
and Mukalay, J.: Guide Des Sols En R.D. Congo. Tome II:
Description et Données Physico-Chimiques de Profils Types.,
Imprimé par l'Ecole Technique Salama, Lubumbashi, R.D. Congo, 2009.</mixed-citation></ref>
      <ref id="bib1.bibx4"><?xmltex \def\ref@label{{Baert et~al.(2013)Baert, Van~Ranst, Ngongo, and
Verdoodt}}?><label>Baert et al.(2013)Baert, Van Ranst, Ngongo, and
Verdoodt</label><?label baertSoilSurveyDR2013?><mixed-citation>
Baert, G., Van Ranst, E., Ngongo, M., and Verdoodt, A.: Soil Survey in DR
Congo  –  from 1935 until Today, Meded. Zitt. K. Acad. overzeese
Wet, 59, 345–362, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx5"><?xmltex \def\ref@label{{Ballabio and
Consonni(2013)}}?><label>Ballabio and
Consonni(2013)</label><?label ballabioClassificationToolsChemistry2013?><mixed-citation>Ballabio, D. and Consonni, V.: Classification Tools in Chemistry. Part 1:
Linear Models, PLS-DA, Analytical Methods, 5, 3790–3798,
<ext-link xlink:href="https://doi.org/10.1039/c3ay40582f" ext-link-type="DOI">10.1039/c3ay40582f</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx6"><?xmltex \def\ref@label{{Barth{\`{e}}s et~al.(2020)Barth{\`{e}}s, Kouakoua, Coll, Clairotte,
Moulin, Saby, Le~Cadre, Etayo, and
Chevallier}}?><label>Barthès et al.(2020)Barthès, Kouakoua, Coll, Clairotte,
Moulin, Saby, Le Cadre, Etayo, and
Chevallier</label><?label barthesImprovementSpectralLibrarybased2020?><mixed-citation>Barthès, B. G., Kouakoua, E., Coll, P., Clairotte, M., Moulin, P., Saby,
N. P., Le Cadre, E., Etayo, A., and Chevallier, T.: Improvement in Spectral
Library-Based Quantification of Soil Properties Using Representative Spiking
and Local Calibration  –  The Case of Soil Inorganic Carbon
Prediction by Mid-Infrared Spectroscopy, Geoderma, 369, 114272,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2020.114272" ext-link-type="DOI">10.1016/j.geoderma.2020.114272</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx7"><?xmltex \def\ref@label{{Baumann(2020)}}?><label>Baumann(2020)</label><?label R-simplerspec?><mixed-citation>
Baumann, P.: Simplerspec: Soil and Plant Spectroscopic Model Building and
Prediction, r package version 0.1.0.9001, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx8"><?xmltex \def\ref@label{{Baumgartner et~al.(2020)Baumgartner, Barthel, Drake, Bauters,
Makelele, Mugula, Summerauer, Gallarotti, Cizungu~Ntaboba, Van~Oost, Boeckx,
Doetterl, Werner, and Six}}?><label>Baumgartner et al.(2020)Baumgartner, Barthel, Drake, Bauters,
Makelele, Mugula, Summerauer, Gallarotti, Cizungu Ntaboba, Van Oost, Boeckx,
Doetterl, Werner, and Six</label><?label baumgartnerSeasonalityDriversIsotopic2020?><mixed-citation>Baumgartner, S., Barthel, M., Drake, T. W., Bauters, M., Makelele, I. A., Mugula, J. K., Summerauer, L., Gallarotti, N., Cizungu Ntaboba, L., Van Oost, K., Boeckx, P., Doetterl, S., Werner, R. A., and Six, J.: Seasonality, drivers, and isotopic composition of soil <inline-formula><mml:math id="M261" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> fluxes from tropical forests of the Congo Basin, Biogeosciences, 17, 6207–6218, <ext-link xlink:href="https://doi.org/10.5194/bg-17-6207-2020" ext-link-type="DOI">10.5194/bg-17-6207-2020</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx9"><?xmltex \def\ref@label{{Bauters et~al.(2015)Bauters, Ampoorter, Huygens, Kearsley,
De~Haulleville, Sellan, Verbeeck, Boeckx, and
Verheyen}}?><label>Bauters et al.(2015)Bauters, Ampoorter, Huygens, Kearsley,
De Haulleville, Sellan, Verbeeck, Boeckx, and
Verheyen</label><?label bautersFunctionalIdentityExplains2015?><mixed-citation>Bauters, M., Ampoorter, E., Huygens, D., Kearsley, E., De Haulleville, T.,
Sellan, G., Verbeeck, H., Boeckx, P., and Verheyen, K.: Functional Identity
Explains Carbon Sequestration in a 77-Year-Old Experimental Tropical
Plantation, Ecosphere, 6, 198, <ext-link xlink:href="https://doi.org/10.1890/ES15-00342.1" ext-link-type="DOI">10.1890/ES15-00342.1</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx10"><?xmltex \def\ref@label{{Bauters et~al.(2017)Bauters, Verbeeck, Doetterl, Ampoorter, Baert,
Vermeir, Verheyen, and Boeckx}}?><label>Bauters et al.(2017)Bauters, Verbeeck, Doetterl, Ampoorter, Baert,
Vermeir, Verheyen, and Boeckx</label><?label bautersFunctionalCompositionTree2017?><mixed-citation>Bauters, M., Verbeeck, H., Doetterl, S., Ampoorter, E., Baert, G., Vermeir, P.,
Verheyen, K., and Boeckx, P.: Functional Composition of Tree
Communities Changed Topsoil Properties in an Old Experimental Tropical
Plantation, Ecosystems, 20, 861–871, <ext-link xlink:href="https://doi.org/10.1007/s10021-016-0081-0" ext-link-type="DOI">10.1007/s10021-016-0081-0</ext-link>,
2017.</mixed-citation></ref>
      <ref id="bib1.bibx11"><?xmltex \def\ref@label{{Bauters et~al.(2019{\natexlab{a}})Bauters, Verbeeck, R{\"{u}}tting,
Barthel, Bazirake~Mujinya, Bamba, Bod{\'{e}}, Boyemba, Bulonza, Carlsson,
Eriksson, Makelele, Six, Cizungu~Ntaboba, and
Boeckx}}?><label>Bauters et al.(2019a)Bauters, Verbeeck, Rütting,
Barthel, Bazirake Mujinya, Bamba, Bodé, Boyemba, Bulonza, Carlsson,
Eriksson, Makelele, Six, Cizungu Ntaboba, and
Boeckx</label><?label bautersContrastingNitrogenFluxes2019?><mixed-citation>Bauters, M., Verbeeck, H., Rütting, T., Barthel, M., Bazirake Mujinya, B.,
Bamba, F., Bodé, S., Boyemba, F., Bulonza, E., Carlsson, E., Eriksson,
L., Makelele, I., Six, J., Cizungu Ntaboba, L., and Boeckx, P.: Contrasting
Nitrogen Fluxes in African Tropical Forests of the Congo Basin,
Ecological Monographs, 89, 1–17, <ext-link xlink:href="https://doi.org/10.1002/ecm.1342" ext-link-type="DOI">10.1002/ecm.1342</ext-link>, 2019a.</mixed-citation></ref>
      <?pagebreak page713?><ref id="bib1.bibx12"><?xmltex \def\ref@label{{Bauters et~al.(2019{\natexlab{b}})Bauters, Vercleyen, Vanlauwe, Six,
Bonyoma, Badjoko, Hubau, Hoyt, Boudin, Verbeeck, and
Boeckx}}?><label>Bauters et al.(2019b)Bauters, Vercleyen, Vanlauwe, Six,
Bonyoma, Badjoko, Hubau, Hoyt, Boudin, Verbeeck, and
Boeckx</label><?label bautersLongTermRecovery2019?><mixed-citation>Bauters, M., Vercleyen, O., Vanlauwe, B., Six, J., Bonyoma, B., Badjoko, H.,
Hubau, W., Hoyt, A., Boudin, M., Verbeeck, H., and Boeckx, P.: Long-term
Recovery of the Functional Community Assembly and Carbon Pools in an
African Tropical Forest Succession, Biotropica, 51, 319–329,
<ext-link xlink:href="https://doi.org/10.1111/btp.12647" ext-link-type="DOI">10.1111/btp.12647</ext-link>, 2019b.</mixed-citation></ref>
      <ref id="bib1.bibx13"><?xmltex \def\ref@label{{Bauters et~al.(2021)Bauters, Moonen, Summerauer, Doetterl, Wasner,
Griepentrog, Mumbanza, Kearsley, Ewango, Boyemba, Six, Muys, Verbist, Boeckx,
and Verheyen}}?><label>Bauters et al.(2021)Bauters, Moonen, Summerauer, Doetterl, Wasner,
Griepentrog, Mumbanza, Kearsley, Ewango, Boyemba, Six, Muys, Verbist, Boeckx,
and Verheyen</label><?label bautersSoilNutrientDepletion2021?><mixed-citation>Bauters, M., Moonen, P., Summerauer, L., Doetterl, S., Wasner, D., Griepentrog,
M., Mumbanza, F. M., Kearsley, E., Ewango, C., Boyemba, F., Six, J., Muys,
B., Verbist, B., Boeckx, P., and Verheyen, K.: Soil Nutrient Depletion
and Tree Functional Composition Shift Following Repeated Clearing in
Secondary Forests of the Congo Basin, Ecosystems, 24, 1422–1435,
<ext-link xlink:href="https://doi.org/10.1007/s10021-020-00593-6" ext-link-type="DOI">10.1007/s10021-020-00593-6</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx14"><?xmltex \def\ref@label{{Beck et~al.(2018)Beck, Zimmermann, McVicar, Vergopolan, Berg, and
Wood}}?><label>Beck et al.(2018)Beck, Zimmermann, McVicar, Vergopolan, Berg, and
Wood</label><?label beckPresentFutureKoppenGeiger2018?><mixed-citation>Beck, H. E., Zimmermann, N. E., McVicar, T. R., Vergopolan, N., Berg, A., and
Wood, E. F.: Present and Future Köppen-Geiger Climate
Classification Maps at 1-Km Resolution, Sci. Data, 5, 1–12,
<ext-link xlink:href="https://doi.org/10.1038/sdata.2018.214" ext-link-type="DOI">10.1038/sdata.2018.214</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx15"><?xmltex \def\ref@label{{{Bellon-Maurel} et~al.(2010){Bellon-Maurel}, {Fernandez-Ahumada},
Palagos, Roger, and McBratney}}?><label>Bellon-Maurel et al.(2010)Bellon-Maurel, Fernandez-Ahumada,
Palagos, Roger, and McBratney</label><?label bellon-maurelCriticalReviewChemometric2010?><mixed-citation>Bellon-Maurel, V., Fernandez-Ahumada, E., Palagos, B., Roger, J.-M., and
McBratney, A.: Critical Review of Chemometric Indicators Commonly Used for
Assessing the Quality of the Prediction of Soil Attributes by NIR
Spectroscopy, TrAC Trends in Analytical Chemistry, 29, 1073–1081,
<ext-link xlink:href="https://doi.org/10.1016/j.trac.2010.05.006" ext-link-type="DOI">10.1016/j.trac.2010.05.006</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx16"><?xmltex \def\ref@label{{Birg{\'{e}} et~al.(2016)Birg{\'{e}}, Bevans, Allen, Angeler, Baer, and
Wall}}?><label>Birgé et al.(2016)Birgé, Bevans, Allen, Angeler, Baer, and
Wall</label><?label birgeAdaptiveManagementSoil2016?><mixed-citation>Birgé, H. E., Bevans, R. A., Allen, C. R., Angeler, D. G., Baer, S. G., and
Wall, D. H.: Adaptive Management for Soil Ecosystem Services, J. Environ. Manage., 183, 371–378, <ext-link xlink:href="https://doi.org/10.1016/j.jenvman.2016.06.024" ext-link-type="DOI">10.1016/j.jenvman.2016.06.024</ext-link>,
2016.</mixed-citation></ref>
      <ref id="bib1.bibx17"><?xmltex \def\ref@label{{Briedis et~al.(2020)Briedis, Baldock, {de Moraes S{\'{a}}}, {dos
Santos}, and Milori}}?><label>Briedis et al.(2020)Briedis, Baldock, de Moraes Sá, dos
Santos, and Milori</label><?label briedisStrategiesImprovePrediction2020?><mixed-citation>Briedis, C., Baldock, J., de Moraes Sá, J. C., dos Santos, J. B., and
Milori, D. M. B. P.: Strategies to Improve the Prediction of Bulk Soil and
Fraction Organic Carbon in Brazilian Samples by Using an Australian
National Mid-Infrared Spectral Library, Geoderma, 373, 1–13,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2020.114401" ext-link-type="DOI">10.1016/j.geoderma.2020.114401</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx18"><?xmltex \def\ref@label{{Clairotte et~al.(2016)Clairotte, Grinand, Kouakoua, Th{\'{e}}bault,
Saby, Bernoux, and Barth{\`{e}}s}}?><label>Clairotte et al.(2016)Clairotte, Grinand, Kouakoua, Thébault,
Saby, Bernoux, and Barthès</label><?label clairotteNationalCalibrationSoil2016?><mixed-citation>Clairotte, M., Grinand, C., Kouakoua, E., Thébault, A., Saby, N. P.,
Bernoux, M., and Barthès, B. G.: National Calibration of Soil Organic
Carbon Concentration Using Diffuse Infrared Reflectance Spectroscopy,
Geoderma, 276, 41–52, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2016.04.021" ext-link-type="DOI">10.1016/j.geoderma.2016.04.021</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx19"><?xmltex \def\ref@label{{Cox et~al.(2013)Cox, Pearson, Booth, Friedlingstein, Huntingford,
Jones, and Luke}}?><label>Cox et al.(2013)Cox, Pearson, Booth, Friedlingstein, Huntingford,
Jones, and Luke</label><?label coxSensitivityTropicalCarbon2013?><mixed-citation>Cox, P. M., Pearson, D., Booth, B. B., Friedlingstein, P., Huntingford, C.,
Jones, C. D., and Luke, C. M.: Sensitivity of Tropical Carbon to Climate
Change Constrained by Carbon Dioxide Variability, Nature, 494, 341–344,
<ext-link xlink:href="https://doi.org/10.1038/nature11882" ext-link-type="DOI">10.1038/nature11882</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx20"><?xmltex \def\ref@label{{Curtis et~al.(2018)Curtis, Slay, Harris, Tyukavina, and
Hansen}}?><label>Curtis et al.(2018)Curtis, Slay, Harris, Tyukavina, and
Hansen</label><?label curtisClassifyingDriversGlobal2018?><mixed-citation>Curtis, P. G., Slay, C. M., Harris, N. L., Tyukavina, A., and Hansen, M. C.:
Classifying Drivers of Global Forest Loss, Science, 361, 1108–1111,
<ext-link xlink:href="https://doi.org/10.1126/science.aau3445" ext-link-type="DOI">10.1126/science.aau3445</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx21"><?xmltex \def\ref@label{{Dangal et~al.(2019)Dangal, Sanderman, Wills, and
{Ramirez-Lopez}}}?><label>Dangal et al.(2019)Dangal, Sanderman, Wills, and
Ramirez-Lopez</label><?label dangalAccuratePrecisePrediction2019?><mixed-citation>Dangal, S., Sanderman, J., Wills, S., and Ramirez-Lopez, L.: Accurate and
Precise Prediction of Soil Properties from a Large Mid-Infrared
Spectral Library, Soil Systems, 3, 1–23, <ext-link xlink:href="https://doi.org/10.3390/soilsystems3010011" ext-link-type="DOI">10.3390/soilsystems3010011</ext-link>,
2019.</mixed-citation></ref>
      <ref id="bib1.bibx22"><?xmltex \def\ref@label{{Dematt{\^{e}} et~al.(2019)Dematt{\^{e}}, Dotto, Paiva, Sato, Dalmolin,
{de Ara{\'{u}}jo}, {da Silva}, Nanni, {ten Caten}, Noronha, Lacerda, {de
Ara{\'{u}}jo Filho}, Rizzo, Bellinaso, Francelino, Schaefer, Vicente, {dos
Santos}, {de S{\'{a}} Barretto Sampaio}, Menezes, {de Souza}, Abrah{\~{a}}o,
Coelho, Grego, Lani, Fernandes, Gon{\c{c}}alves, Silva, {de Menezes}, Curi,
Couto, {dos Anjos}, Ceddia, Pinheiro, Grunwald, Vasques, Marques~J{\'{u}}nior,
{da Silva}, Barreto, N{\'{o}}brega, {da Silva}, {de Souza}, Valladares, Viana,
{da Silva Terra}, {Hor{\'{a}}k-Terra}, Fiorio, {da Silva}, Frade~J{\'{u}}nior,
Lima, Alba, {de Souza Junior}, Brefin, Ruivo, Ferreira, Brait, Caetano,
Bringhenti, {de Sousa Mendes}, Safanelli, Guimar{\~{a}}es, Poppiel, {e Souza},
Quesada, and {do Couto}}}?><label>Demattê et al.(2019)Demattê, Dotto, Paiva, Sato, Dalmolin,
de Araújo, da Silva, Nanni, ten Caten, Noronha, Lacerda, de
Araújo Filho, Rizzo, Bellinaso, Francelino, Schaefer, Vicente, dos
Santos, de Sá Barretto Sampaio, Menezes, de Souza, Abrahão,
Coelho, Grego, Lani, Fernandes, Gonçalves, Silva, de Menezes, Curi,
Couto, dos Anjos, Ceddia, Pinheiro, Grunwald, Vasques, Marques Júnior,
da Silva, Barreto, Nóbrega, da Silva, de Souza, Valladares, Viana,
da Silva Terra, Horák-Terra, Fiorio, da Silva, Frade Júnior,
Lima, Alba, de Souza Junior, Brefin, Ruivo, Ferreira, Brait, Caetano,
Bringhenti, de Sousa Mendes, Safanelli, Guimarães, Poppiel, e Souza,
Quesada, and do Couto</label><?label dematteBrazilianSoilSpectral2019?><mixed-citation>Demattê, J. A. M., Dotto, A. C., Paiva, A. F. S., Sato, M. V., Dalmolin, R.
S. D., de Araújo, M. d. S. B., da Silva, E. B., Nanni, M. R., ten
Caten, A., Noronha, N. C., Lacerda, M. P. C., de Araújo Filho, J. C.,
Rizzo, R., Bellinaso, H., Francelino, M. R., Schaefer, C. E. G. R., Vicente,
L. E., dos Santos, U. J., de Sá Barretto Sampaio, E. V., Menezes, R.
S. C., de Souza, J. J. L. L., Abrahão, W. A. P., Coelho, R. M., Grego,
C. R., Lani, J. L., Fernandes, A. R., Gonçalves, D. A. M., Silva, S.
H. G., de Menezes, M. D., Curi, N., Couto, E. G., dos Anjos, L. H. C.,
Ceddia, M. B., Pinheiro, É. F. M., Grunwald, S., Vasques, G. M.,
Marques Júnior, J., da Silva, A. J., Barreto, M. C. d. V., Nóbrega,
G. N., da Silva, M. Z., de Souza, S. F., Valladares, G. S., Viana, J.
H. M., da Silva Terra, F., Horák-Terra, I., Fiorio, P. R., da
Silva, R. C., Frade Júnior, E. F., Lima, R. H. C., Alba, J. M. F., de
Souza Junior, V. S., Brefin, M. D. L. M. S., Ruivo, M. D. L. P., Ferreira,
T. O., Brait, M. A., Caetano, N. R., Bringhenti, I., de Sousa Mendes, W.,
Safanelli, J. L., Guimarães, C. C. B., Poppiel, R. R., e Souza, A. B.,
Quesada, C. A., and do Couto, H. T. Z.: The Brazilian Soil Spectral
Library (BSSL): A General View, Application and Challenges,
Geoderma, 354, 1–21, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2019.05.043" ext-link-type="DOI">10.1016/j.geoderma.2019.05.043</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx23"><?xmltex \def\ref@label{{Doetterl et~al.(2021)Doetterl, Asifiwe, Baert, Bamba, Bauters,
Boeckx, Bukombe, Cadisch, Cizungu, Cooper, Hoyt, Kabaseke, Kalbitz, Kidinda,
Maier, Mainka, Mayrock, Muhindo, Mujinya, Mukotanyi, Nabahungu, Reichenbach,
Rewald, Six, Stegmann, Summerauer, Unseld, Vanlauwe, Van~Oost, Verheyen,
Vogel, Wilken, and Fiener}}?><label>Doetterl et al.(2021)Doetterl, Asifiwe, Baert, Bamba, Bauters,
Boeckx, Bukombe, Cadisch, Cizungu, Cooper, Hoyt, Kabaseke, Kalbitz, Kidinda,
Maier, Mainka, Mayrock, Muhindo, Mujinya, Mukotanyi, Nabahungu, Reichenbach,
Rewald, Six, Stegmann, Summerauer, Unseld, Vanlauwe, Van Oost, Verheyen,
Vogel, Wilken, and Fiener</label><?label essd-2021-73?><mixed-citation>Doetterl, S., Asifiwe, R. K., Baert, G., Bamba, F., Bauters, M., Boeckx, P., Bukombe, B., Cadisch, G., Cooper, M., Cizungu, L. N., Hoyt, A., Kabaseke, C., Kalbitz, K., Kidinda, L., Maier, A., Mainka, M., Mayrock, J., Muhindo, D., Mujinya, B. B., Mukotanyi, S. M., Nabahungu, L., Reichenbach, M., Rewald, B., Six, J., Stegmann, A., Summerauer, L., Unseld, R., Vanlauwe, B., Van Oost, K., Verheyen, K., Vogel, C., Wilken, F., and Fiener, P.: Organic matter cycling along geochemical, geomorphic, and disturbance gradients in forest and cropland of the African Tropics – project TropSOC database version 1.0, Earth Syst. Sci. Data, 13, 4133–4153, <ext-link xlink:href="https://doi.org/10.5194/essd-13-4133-2021" ext-link-type="DOI">10.5194/essd-13-4133-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx24"><?xmltex \def\ref@label{{Don et~al.(2011)Don, Schumacher, and
Freibauer}}?><label>Don et al.(2011)Don, Schumacher, and
Freibauer</label><?label donImpactTropicalLanduse2011?><mixed-citation>Don, A., Schumacher, J., and Freibauer, A.: Impact of Tropical Land-Use Change
on Soil Organic Carbon Stocks – a Meta-Analysis: SOIL ORGANIC CARBON AND
LAND-USE CHANGE, Global Change Biol., 17, 1658–1670,
<ext-link xlink:href="https://doi.org/10.1111/j.1365-2486.2010.02336.x" ext-link-type="DOI">10.1111/j.1365-2486.2010.02336.x</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bibx25"><?xmltex \def\ref@label{{Fick and Hijmans(2017)}}?><label>Fick and Hijmans(2017)</label><?label fickWorldClimNewKm2017?><mixed-citation>Fick, S. E. and Hijmans, R. J.: WorldClim 2: New 1-km Spatial Resolution
Climate Surfaces for Global Land Areas, Int.  J. Clim.,
37, 4302–4315, <ext-link xlink:href="https://doi.org/10.1002/joc.5086" ext-link-type="DOI">10.1002/joc.5086</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx26"><?xmltex \def\ref@label{{Fortin et~al.(2016)Fortin, Dale, and
Ver~Hoef}}?><label>Fortin et al.(2016)Fortin, Dale, and
Ver Hoef</label><?label fortinSpatialAnalysisEcology2016?><mixed-citation>
Fortin, M.-J., Dale, M. R., and Ver Hoef, J. M.: Spatial Analysis in
Ecology, in: Wiley StatsRef: Statistics Reference Online, edited
by: Balakrishnan, N., Colton, T., Everitt, B., Piegorsch, W., Ruggeri, F., and
Teugels, J. L., John Wiley &amp; Sons, Ltd, Chichester, UK, 13 pp., 2016.</mixed-citation></ref>
      <ref id="bib1.bibx27"><?xmltex \def\ref@label{{Gallarotti et~al.(2021)Gallarotti, Barthel, Verhoeven, Pereira,
Bauters, Baumgartner, Drake, Boeckx, Mohn, Longepierre, Mugula, Makelele,
Ntaboba, and Six}}?><label>Gallarotti et al.(2021)Gallarotti, Barthel, Verhoeven, Pereira,
Bauters, Baumgartner, Drake, Boeckx, Mohn, Longepierre, Mugula, Makelele,
Ntaboba, and Six</label><?label gallarottiIndepthAnalysisN2O2021?><mixed-citation>Gallarotti, N., Barthel, M., Verhoeven, E., Pereira, E. I. P., Bauters, M.,
Baumgartner, S., Drake, T. W., Boeckx, P., Mohn, J., Longepierre, M., Mugula,
J. K., Makelele, I. A., Ntaboba, L. C., and Six, J.: In-Depth Analysis of
N2O Fluxes in Tropical Forest Soils of the Congo Basin Combining
Isotope and Functional Gene Analysis, International Society for Microbial
Ecology Journal, ISME J., <ext-link xlink:href="https://doi.org/10.1038/s41396-021-01004-x" ext-link-type="DOI">10.1038/s41396-021-01004-x</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx28"><?xmltex \def\ref@label{{Gomez et~al.(2020)Gomez, Chevallier, Moulin, Bouferra, Hmaidi,
Arrouays, Jolivet, and Barth{\`{e}}s}}?><label>Gomez et al.(2020)Gomez, Chevallier, Moulin, Bouferra, Hmaidi,
Arrouays, Jolivet, and Barthès</label><?label gomezPredictionSoilOrganic2020?><mixed-citation>Gomez, C., Chevallier, T., Moulin, P., Bouferra, I., Hmaidi, K., Arrouays, D.,
Jolivet, C., and Barthès, B. G.: Prediction of Soil Organic and Inorganic
Carbon Concentrations in Tunisian Samples by Mid-Infrared Reflectance
Spectroscopy Using a French National Library, Geoderma, 375, 1–14,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2020.114469" ext-link-type="DOI">10.1016/j.geoderma.2020.114469</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx29"><?xmltex \def\ref@label{{Goyens et~al.(2007)Goyens, Verdoodt, Van De~Wauw, Baert, Van~Engelen,
Dijkshoorn, and Van~Ranst}}?><label>Goyens et al.(2007)Goyens, Verdoodt, Van De Wauw, Baert, Van Engelen,
Dijkshoorn, and Van Ranst</label><?label goyensBaseDonneesNumeriques2007?><mixed-citation>
Goyens, C., Verdoodt, A., Van De Wauw, J., Baert, G., Van Engelen, V.,
Dijkshoorn, J., and Van Ranst, E.: Base de Données Numériques sur les
SOls et le TERrain (SOTER) de l'Afrique Centrale (RD Congo, Rwanda et
Burundi), Etude et Gestion des Sols, 14, 207–218, 2007.</mixed-citation></ref>
      <ref id="bib1.bibx30"><?xmltex \def\ref@label{{Guerrero et~al.(2010)Guerrero, Zornoza, G{\'{o}}mez, and
{Mataix-Beneyto}}}?><label>Guerrero et al.(2010)Guerrero, Zornoza, Gómez, and
Mataix-Beneyto</label><?label guerreroSpikingNIRRegional2010?><mixed-citation>Guerrero, C., Zornoza, R., Gómez, I., and Mataix-Beneyto, J.: Spiking of
NIR Regional Models Using Samples from Target Sites: Effect of Model
Size on Prediction Accuracy, Geoderma, 158, 66–77,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2009.12.021" ext-link-type="DOI">10.1016/j.geoderma.2009.12.021</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx31"><?xmltex \def\ref@label{{Guerrero et~al.(2014)Guerrero, Stenberg, Wetterlind, Viscarra~Rossel,
Maestre, Mouazen, Zornoza, {Ruiz-Sinoga}, and
Kuang}}?><label>Guerrero et al.(2014)Guerrero, Stenberg, Wetterlind, Viscarra Rossel,
Maestre, Mouazen, Zornoza, Ruiz-Sinoga, and
Kuang</label><?label guerreroAssessmentSoilOrganic2014?><mixed-citation>Guerrero, C., Sten<?pagebreak page714?>berg, B., Wetterlind, J., Viscarra Rossel, R. A., Maestre,
F. T., Mouazen, A. M., Zornoza, R., Ruiz-Sinoga, J. D., and Kuang, B.:
Assessment of Soil Organic Carbon at Local Scale with Spiked NIR
Calibrations: Effects of Selection and Extra-Weighting on the Spiking Subset,
Europ. J. Soil Sci., 65, 248–263, <ext-link xlink:href="https://doi.org/10.1111/ejss.12129" ext-link-type="DOI">10.1111/ejss.12129</ext-link>,
2014.</mixed-citation></ref>
      <ref id="bib1.bibx32"><?xmltex \def\ref@label{{Hansen et~al.(2013)Hansen, Potapov, Moore, Hancher, Turubanova,
Tyukavina, Thau, Stehman, Goetz, Loveland, Kommareddy, Egorov, Chini,
Justice, and Townshend}}?><label>Hansen et al.(2013)Hansen, Potapov, Moore, Hancher, Turubanova,
Tyukavina, Thau, Stehman, Goetz, Loveland, Kommareddy, Egorov, Chini,
Justice, and Townshend</label><?label hansenHighResolutionGlobalMaps2013?><mixed-citation>Hansen, M. C., Potapov, P. V., Moore, R., Hancher, M., Turubanova, S. A.,
Tyukavina, A., Thau, D., Stehman, S. V., Goetz, S. J., Loveland, T. R.,
Kommareddy, A., Egorov, A., Chini, L., Justice, C. O., and Townshend, J.
R. G.: High-Resolution Global Maps of 21st-Century Forest Cover
Change, Science, 342, 850–853, <ext-link xlink:href="https://doi.org/10.1126/science.1244693" ext-link-type="DOI">10.1126/science.1244693</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx33"><?xmltex \def\ref@label{{{Heri-Kazi}(2020)}}?><label>Heri-Kazi(2020)</label><?label heri-kaziCaracterisationEtatDegradation2020?><mixed-citation>
Heri-Kazi, A. B.: Caractérisation de l'état de dégradation des terres
par l'érosion hydrique dans le Sud-Kivu montagneux à l'Est de la R.D.
Congo, Thèse doctorale, Université Catholique de Louvain, Louvain La
Neuve, 279 pp., 2020.</mixed-citation></ref>
      <ref id="bib1.bibx34"><?xmltex \def\ref@label{{Imerzoukene and
Van~Ranst(2002)}}?><label>Imerzoukene and
Van Ranst(2002)</label><?label imerzoukeneBanqueDonneesPedologiques2002?><mixed-citation>
Imerzoukene, S. and Van Ranst, E.: Une Banque de Données Pédologiques et
Son S.I.G, Pour Une Nouvelle Politique Agricole Au Rwanda,
Meded. Zitt. K. Acad. overzeese Wet, 47, 299–325, 2002.</mixed-citation></ref>
      <ref id="bib1.bibx35"><?xmltex \def\ref@label{{{IUSS Working Group
WRB}(2015)}}?><label>IUSS Working Group
WRB(2015)</label><?label iussworkinggroupwrbInternationalSoilClassification2015?><mixed-citation>
IUSS Working Group WRB: International Soil Classification System for Naming
Soils and Creating Legends for Soil Maps, World Soil Resources Reports
No. 106, FAO, Rome, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx36"><?xmltex \def\ref@label{{Janik et~al.(1998)Janik, Merry, and
Skjemstad}}?><label>Janik et al.(1998)Janik, Merry, and
Skjemstad</label><?label janikCanMidInfrared1998?><mixed-citation>Janik, L. J., Merry, R. H., and Skjemstad, J. O.: Can Mid Infrared Diffuse
Reflectance Analysis Replace Soil Extractions?, Austr. J.  Exp. Agr., 38, 681–696, <ext-link xlink:href="https://doi.org/10.1071/EA97144" ext-link-type="DOI">10.1071/EA97144</ext-link>, 1998.</mixed-citation></ref>
      <ref id="bib1.bibx37"><?xmltex \def\ref@label{{Jarvis et~al.(2008)Jarvis, Reuter, Nelson, and
Guevara}}?><label>Jarvis et al.(2008)Jarvis, Reuter, Nelson, and
Guevara</label><?label jarvisHolefilledSeamlessSRTM2008?><mixed-citation>Jarvis, A., Reuter, H. I., Nelson, A., and Guevara, E.: Hole-Filled Seamless
SRTM Data V4, <uri>https://srtm.csi.cgiar.org</uri> (last access: 20 December 2020), 2008.</mixed-citation></ref>
      <ref id="bib1.bibx38"><?xmltex \def\ref@label{{Jones et~al.(2013)Jones, {Breuning-Madsen}, Brossard, Dampha,
Deckers, Dewitte, Hallett, Jones, Kilasara, Le~Roux, Micheli, Montanarella,
Spaargaren, Tahar, Thiombiano, Van~Ranst, Yemefack, and
Zougmore}}?><label>Jones et al.(2013)Jones, Breuning-Madsen, Brossard, Dampha,
Deckers, Dewitte, Hallett, Jones, Kilasara, Le Roux, Micheli, Montanarella,
Spaargaren, Tahar, Thiombiano, Van Ranst, Yemefack, and
Zougmore</label><?label jonesSoilAtlasAfrica2013?><mixed-citation>Jones, A., Breuning-Madsen, H., Brossard, M., Dampha, A., Deckers, J.,
Dewitte, O., Hallett, S., Jones, R., Kilasara, M., Le Roux, P., Micheli, E.,
Montanarella, L., Spaargaren, O., Tahar, G., Thiombiano, L., Van Ranst, E.,
Yemefack, M., and Zougmore, R.: Soil Atlas of Africa, European
Commission, Publication Office of the European Union, Luxembourg,
<ext-link xlink:href="https://doi.org/10.2788/52319" ext-link-type="DOI">10.2788/52319</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx39"><?xmltex \def\ref@label{{Kearsley et~al.(2013)Kearsley, {de Haulleville}, Hufkens, Kidimbu,
Toirambe, Baert, Huygens, Kebede, Defourny, Bogaert, Beeckman, Steppe,
Boeckx, and Verbeeck}}?><label>Kearsley et al.(2013)Kearsley, de Haulleville, Hufkens, Kidimbu,
Toirambe, Baert, Huygens, Kebede, Defourny, Bogaert, Beeckman, Steppe,
Boeckx, and Verbeeck</label><?label kearsleyConventionalTreeHeight2013?><mixed-citation>Kearsley, E., de Haulleville, T., Hufkens, K., Kidimbu, A., Toirambe, B.,
Baert, G., Huygens, D., Kebede, Y., Defourny, P., Bogaert, J., Beeckman, H.,
Steppe, K., Boeckx, P., and Verbeeck, H.: Conventional Tree Height – Diameter Relationships Significantly Overestimate Aboveground Carbon Stocks
in the Central Congo Basin, Nat. Commun., 4, 1–8,
<ext-link xlink:href="https://doi.org/10.1038/ncomms3269" ext-link-type="DOI">10.1038/ncomms3269</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx40"><?xmltex \def\ref@label{{Kearsley et~al.(2017)Kearsley, Verbeeck, Hufkens, {Van de Perre},
Doetterl, Baert, Beeckman, Boeckx, and
Huygens}}?><label>Kearsley et al.(2017)Kearsley, Verbeeck, Hufkens, Van de Perre,
Doetterl, Baert, Beeckman, Boeckx, and
Huygens</label><?label kearsleyFunctionalCommunityStructure2017?><mixed-citation>Kearsley, E., Verbeeck, H., Hufkens, K., Van de Perre, F., Doetterl, S.,
Baert, G., Beeckman, H., Boeckx, P., and Huygens, D.: Functional Community
Structure of African Monodominant <italic>Gilbertiodendron Dewevrei</italic> Forest Influenced by Local Environmental Filtering, Ecol.
Evol., 7, 295–304, <ext-link xlink:href="https://doi.org/10.1002/ece3.2589" ext-link-type="DOI">10.1002/ece3.2589</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx41"><?xmltex \def\ref@label{{Lobsey et~al.(2017)Lobsey, Viscarra~Rossel, Poudier, and
Hedley}}?><label>Lobsey et al.(2017)Lobsey, Viscarra Rossel, Poudier, and
Hedley</label><?label lobseyRsLocalData2017?><mixed-citation>Lobsey, R., C., Viscarra Rossel, R. A., Poudier, P., and Hedley, C. B.:
Rs-local Data-mines Information from Spectral Libraries to Improve Local
Calibrations, Europ. J. Soil Sci., 68, 840–852,
<ext-link xlink:href="https://doi.org/10.1111/ejss.12490" ext-link-type="DOI">10.1111/ejss.12490</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx42"><?xmltex \def\ref@label{{Minten(2017)}}?><label>Minten(2017)</label><?label mintenDevelopmentBusinessPlan2017?><mixed-citation>
Minten, K.: Development Of a Business Plan For Production And Export Of
Green Coffee Beans From The Equateur Province In The Democratic Republic Of
The Congo, Master thesis, Ghent University, Ghent, Belgium, 68 pp., 2017.</mixed-citation></ref>
      <ref id="bib1.bibx43"><?xmltex \def\ref@label{{Moonen et~al.(2019)Moonen, Verbist, Boyemba~Bosela, Norgrove,
Dondeyne, Van~Meerbeek, Kearsley, Verbeeck, Vermeir, Boeckx, and
Muys}}?><label>Moonen et al.(2019)Moonen, Verbist, Boyemba Bosela, Norgrove,
Dondeyne, Van Meerbeek, Kearsley, Verbeeck, Vermeir, Boeckx, and
Muys</label><?label moonenDisentanglingHowManagement2019?><mixed-citation>Moonen, P. C., Verbist, B., Boyemba Bosela, F., Norgrove, L., Dondeyne, S.,
Van Meerbeek, K., Kearsley, E., Verbeeck, H., Vermeir, P., Boeckx, P., and
Muys, B.: Disentangling How Management Affects Biomass Stock and Productivity
of Tropical Secondary Forests Fallows, Sci. Tot. Environ., 659,
101–114, <ext-link xlink:href="https://doi.org/10.1016/j.scitotenv.2018.12.138" ext-link-type="DOI">10.1016/j.scitotenv.2018.12.138</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx44"><?xmltex \def\ref@label{{Mujinya(2012)}}?><label>Mujinya(2012)</label><?label mujinyaEffectsMacrotermesTermites2012?><mixed-citation>
Mujinya, B. B.: Effects of Macrotermes Termites on the Mineralogical and
Electro-Chemical Properties of Ferralsol Materials in the Upper
Katanga (D.R. Congo), Doctoral thesis, Ghent University,
Ghent, Belgium, 190 pp., 2012.</mixed-citation></ref>
      <ref id="bib1.bibx45"><?xmltex \def\ref@label{{Mujinya et~al.(2010)Mujinya, Van~Ranst, Verdoodt, Baert, and
Ngongo}}?><label>Mujinya et al.(2010)Mujinya, Van Ranst, Verdoodt, Baert, and
Ngongo</label><?label mujinyaTermiteBioturbationEffects2010?><mixed-citation>Mujinya, B. B., Van Ranst, E., Verdoodt, A., Baert, G., and Ngongo, L.: Termite
Bioturbation Effects on Electro-Chemical Properties of Ferralsols in the
Upper Katanga (D.R. Congo), Geoderma, 158, 233–241,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2010.04.033" ext-link-type="DOI">10.1016/j.geoderma.2010.04.033</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx46"><?xmltex \def\ref@label{{Mujinya et~al.(2011)Mujinya, Mees, Boeckx, Bod{\'{e}}, Baert, Erens,
Delefortrie, Verdoodt, Ngongo, and
Van~Ranst}}?><label>Mujinya et al.(2011)Mujinya, Mees, Boeckx, Bodé, Baert, Erens,
Delefortrie, Verdoodt, Ngongo, and
Van Ranst</label><?label mujinyaOriginCarbonatesTermite2011?><mixed-citation>Mujinya, B. B., Mees, F., Boeckx, P., Bodé, S., Baert, G., Erens, H.,
Delefortrie, S., Verdoodt, A., Ngongo, M., and Van Ranst, E.: The Origin of
Carbonates in Termite Mounds of the Lubumbashi Area, D.R.
Congo, Geoderma, 165, 95–105, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2011.07.009" ext-link-type="DOI">10.1016/j.geoderma.2011.07.009</ext-link>,
2011.</mixed-citation></ref>
      <ref id="bib1.bibx47"><?xmltex \def\ref@label{{Mujinya et~al.(2013)Mujinya, Mees, Erens, Dumon, Baert, Boeckx,
Ngongo, and Van~Ranst}}?><label>Mujinya et al.(2013)Mujinya, Mees, Erens, Dumon, Baert, Boeckx,
Ngongo, and Van Ranst</label><?label mujinyaClayCompositionProperties2013?><mixed-citation>Mujinya, B. B., Mees, F., Erens, H., Dumon, M., Baert, G., Boeckx, P., Ngongo,
M., and Van Ranst, E.: Clay Composition and Properties in Termite Mounds of
the Lubumbashi Area, D.R. Congo, Geoderma, 192, 304–315,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2012.08.010" ext-link-type="DOI">10.1016/j.geoderma.2012.08.010</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx48"><?xmltex \def\ref@label{{Mujinya et~al.(2014)Mujinya, Adam, Mees, Bogaert, Vranken, Erens,
Baert, Ngongo, and Van~Ranst}}?><label>Mujinya et al.(2014)Mujinya, Adam, Mees, Bogaert, Vranken, Erens,
Baert, Ngongo, and Van Ranst</label><?label mujinyaSpatialPatternsMorphology2014?><mixed-citation>Mujinya, B. B., Adam, M., Mees, F., Bogaert, J., Vranken, I., Erens, H., Baert,
G., Ngongo, M., and Van Ranst, E.: Spatial Patterns and Morphology of Termite
(Macrotermes Falciger) Mounds in the Upper Katanga, D.R.
Congo, Catena, 114, 97–106, <ext-link xlink:href="https://doi.org/10.1016/j.catena.2013.10.015" ext-link-type="DOI">10.1016/j.catena.2013.10.015</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bibx49"><?xmltex \def\ref@label{{N{\ae}s(1987)}}?><label>Næs(1987)</label><?label naesDesignCalibrationInfrared1987?><mixed-citation>Næs, T.: The Design of Calibration in near Infra-Red Reflectance Analysis
by Clustering, J. Chemometr., 1, 121–134,
<ext-link xlink:href="https://doi.org/10.1002/cem.1180010207" ext-link-type="DOI">10.1002/cem.1180010207</ext-link>, 1987.</mixed-citation></ref>
      <ref id="bib1.bibx50"><?xmltex \def\ref@label{{Naes et~al.(1990)Naes, Isaksson, and
Kowalski}}?><label>Naes et al.(1990)Naes, Isaksson, and
Kowalski</label><?label naesLocallyWeightedRegression1990?><mixed-citation>Naes, T., Isaksson, T., and Kowalski, B.: Locally Weighted Regression and
Scatter Correction for Near-Infrared Reflectance Data, Anal. Chem.,
62, 664–673, <ext-link xlink:href="https://doi.org/10.1021/ac00206a003" ext-link-type="DOI">10.1021/ac00206a003</ext-link>, 1990.</mixed-citation></ref>
      <ref id="bib1.bibx51"><?xmltex \def\ref@label{{Ng et~al.(2019)Ng, Minasny, Montazerolghaem, Padarian, Ferguson,
Bailey, and McBratney}}?><label>Ng et al.(2019)Ng, Minasny, Montazerolghaem, Padarian, Ferguson,
Bailey, and McBratney</label><?label ngConvolutionalNeuralNetwork2019?><mixed-citation>Ng, W., Minasny, B., Montazerolghaem, M., Padarian, J., Ferguson, R., Bailey,
S., and McBratney, A. B.: Convolutional Neural Network for Simultaneous
Prediction of Several Soil Properties Using Visible/near-Infrared,
Mid-Infrared, and Their Combined Spectra, Geoderma, 352, 251–267,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2019.06.016" ext-link-type="DOI">10.1016/j.geoderma.2019.06.016</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx52"><?xmltex \def\ref@label{{Nocita et~al.(2014)Nocita, Stevens, Toth, Panagos, {van Wesemael},
and Montanarella}}?><label>Nocita et al.(2014)Nocita, Stevens, Toth, Panagos, van Wesemael,
and Montanarella</label><?label nocitaPredictionSoilOrganic2014?><mixed-citation>Nocita, M., Stevens, A., Toth, G., Panagos, P., van Wesemael, B., and
Montanarella, L.: Prediction of Soil Organic Carbon Content by Diffuse
Reflectance Spectroscopy Using a Local Partial Least Square Regression
Approach, Soil Biol. Biochem., 68, 337–347,
<ext-link xlink:href="https://doi.org/10.1016/j.soilbio.2013.10.022" ext-link-type="DOI">10.1016/j.soilbio.2013.10.022</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bibx53"><?xmltex \def\ref@label{{Nocita et~al.(2015)Nocita, Stevens, {van Wesemael}, Aitkenhead,
Bachmann, Barth{\`{e}}s, Ben~Dor, Brown, Clairotte, Csorba, Dardenne,
Dematt{\^{e}}, Genot, Guerrero, Knadel, Montanarella, Noon, {Ramirez-Lopez},
Robertson, Sakai, {Soriano-Disla}, Shepherd, Stenberg, Towett, Vargas, and
Wetterlind}}?><label>Nocita et al.(2015)Nocita, Stevens, van Wesemael, Aitkenhead,
Bachmann, Barthès, Ben Dor, Brown, Clairotte, Csorba, Dardenne,
Demattê, Genot, Guerrero, Knadel, Montanarella, Noon, Ramirez-Lopez,
Robertson, Sakai, Soriano-Disla, Shepherd, Stenberg, Towett, Vargas, and
Wetterlind</label><?label nocitaSoilSpectroscopyAlternative2015?><mixed-citation>Nocita, M., Stevens, A., van Wesemael, B., Aitkenhead, M., Bachmann, M.,
Barthès, B., Ben Dor, E., Brown, D. J., Clairotte, M., Csorba, A.,
Dardenne, P., Demattê, J. A., Genot, V., Guerrero, C., Knadel, M.,
Montanarella, L., Noon, C., Ramirez-Lopez, L., Robertson, J., Sakai, H.,
Soriano-Disla, J. M., Shepherd, K. D., Stenberg, B., Towett, E. K., Vargas,
R., and Wetterlind, J.: Soil Spectroscopy: An Alternative to Wet
Chemistry for Soil Monitoring, in: Advances in Agronomy, Vol. 132,
Elsevier, 139–159, <ext-link xlink:href="https://doi.org/10.1016/bs.agron.2015.02.002" ext-link-type="DOI">10.1016/bs.agron.2015.02.002</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx54"><?xmltex \def\ref@label{{Padarian et~al.(2019)Padarian, Minasny, and
McBratney}}?><label>Padarian et al.(2019)Padarian, Minasny, and
McBratney</label><?label padarianTransferLearningLocalise2019?><mixed-citation>Padarian, J., Minasny, B., and McBratney, A.: Transfer Learning to Localise a
Continental Soil Vis-NIR Calibration Model, Geoderma, 340, 279–288,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2019.01.009" ext-link-type="DOI">10.1016/j.geoderma.2019.01.009</ext-link>, 2019.</mixed-citation></ref>
      <?pagebreak page715?><ref id="bib1.bibx55"><?xmltex \def\ref@label{{{R Core Team}(2020)}}?><label>R Core Team(2020)</label><?label R-base?><mixed-citation>
R Core Team: R: A Language and Environment for Statistical Computing, R
Foundation for Statistical Computing, Vienna, Austria, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx56"><?xmltex \def\ref@label{{{Ramirez-Lopez}(2020)}}?><label>Ramirez-Lopez(2020)</label><?label R-resemble?><mixed-citation>
Ramirez-Lopez, L.: Resemble: Regression and Similarity Evaluation for
Memory-Based Learning in Spectral Chemometrics, r package version 2.1.1,
2020.</mixed-citation></ref>
      <ref id="bib1.bibx57"><?xmltex \def\ref@label{{{Ramirez-Lopez} et~al.(2013{\natexlab{a}}){Ramirez-Lopez}, Behrens,
Schmidt, Rossel, Dematt{\^{e}}, and
Scholten}}?><label>Ramirez-Lopez et al.(2013a)Ramirez-Lopez, Behrens,
Schmidt, Rossel, Demattê, and
Scholten</label><?label ramirez-lopezDistanceSimilaritysearchMetrics2013?><mixed-citation>Ramirez-Lopez, L., Behrens, T., Schmidt, K., Rossel, R. V., Demattê, J.,
and Scholten, T.: Distance and Similarity-Search Metrics for Use with Soil
Vis-NIR Spectra, Geoderma, 199, 43–53,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2012.08.035" ext-link-type="DOI">10.1016/j.geoderma.2012.08.035</ext-link>, 2013a.</mixed-citation></ref>
      <ref id="bib1.bibx58"><?xmltex \def\ref@label{{{Ramirez-Lopez} et~al.(2013{\natexlab{b}}){Ramirez-Lopez}, Behrens,
Schmidt, Stevens, Dematt{\^{e}}, and
Scholten}}?><label>Ramirez-Lopez et al.(2013b)Ramirez-Lopez, Behrens,
Schmidt, Stevens, Demattê, and
Scholten</label><?label ramirez-lopezSpectrumbasedLearnerNew2013?><mixed-citation>Ramirez-Lopez, L., Behrens, T., Schmidt, K., Stevens, A., Demattê, J.
A. M., and Scholten, T.: The Spectrum-Based Learner: A New Local Approach
for Modeling Soil Vis–NIR Spectra of Complex Datasets,
Geoderma, 195, 268–279, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2012.12.014" ext-link-type="DOI">10.1016/j.geoderma.2012.12.014</ext-link>,
2013b.</mixed-citation></ref>
      <ref id="bib1.bibx59"><?xmltex \def\ref@label{{{Ramirez-Lopez} et~al.(2014){Ramirez-Lopez}, Schmidt, Behrens, {van
Wesemael}, Dematt{\^{e}}, and
Scholten}}?><label>Ramirez-Lopez et al.(2014)Ramirez-Lopez, Schmidt, Behrens, van
Wesemael, Demattê, and
Scholten</label><?label ramirez-lopezSamplingOptimalCalibration2014?><mixed-citation>Ramirez-Lopez, L., Schmidt, K., Behrens, T., van Wesemael, B., Demattê,
J. A., and Scholten, T.: Sampling Optimal Calibration Sets in Soil Infrared
Spectroscopy, Geoderma, 226, 140–150, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2014.02.002" ext-link-type="DOI">10.1016/j.geoderma.2014.02.002</ext-link>,
2014.</mixed-citation></ref>
      <ref id="bib1.bibx60"><?xmltex \def\ref@label{{Ramirez-Lopez et~al.(2019)Ramirez-Lopez, Wadoux, Franceschini, Terra,
Marques, Say{\~{a}}o, and Dematt{\^{e}}}}?><label>Ramirez-Lopez et al.(2019)Ramirez-Lopez, Wadoux, Franceschini, Terra,
Marques, Sayão, and Demattê</label><?label ramirez-lopezRobustSoilMapping2019?><mixed-citation>Ramirez-Lopez, L., Wadoux, A. M. J.-C., Franceschini, M. H. D., Terra, F. S.,
Marques, K. P. P., Sayão, V. M., and Demattê, J. A. M.: Robust Soil
Mapping at the Farm Scale with Vis-NIR Spectroscopy, Europ.
J. Soil Sci., 70, 378–393, <ext-link xlink:href="https://doi.org/10.1111/ejss.12752" ext-link-type="DOI">10.1111/ejss.12752</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx61"><?xmltex \def\ref@label{{Rinnan(2014)}}?><label>Rinnan(2014)</label><?label rinnanPreprocessingVibrationalSpectroscopy2014?><mixed-citation>Rinnan, A.: Pre-Processing in Vibrational Spectroscopy  –  When, Why
and How, Anal. Meth., 6, 7124–7129, <ext-link xlink:href="https://doi.org/10.1039/C3AY42270D" ext-link-type="DOI">10.1039/C3AY42270D</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bibx62"><?xmltex \def\ref@label{{Sanderman et~al.(2020)Sanderman, Savage, and
Dangal}}?><label>Sanderman et al.(2020)Sanderman, Savage, and
Dangal</label><?label sandermanMidInfraredSpectroscopy2020?><mixed-citation>Sanderman, J., Savage, K., and Dangal, S. R.: Mid-infrared Spectroscopy for
Prediction of Soil Health Indicators in the United States, Soil Sci.
Soc. Am. J., 84, 251–261, <ext-link xlink:href="https://doi.org/10.1002/saj2.20009" ext-link-type="DOI">10.1002/saj2.20009</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx63"><?xmltex \def\ref@label{{Savitzky and Golay(1964)}}?><label>Savitzky and Golay(1964)</label><?label savitzkySmoothingDifferentiationData1964?><mixed-citation>Savitzky, A. and Golay, M. J. E.: Smoothing and Differentiation of Data
by Simplified Least Squares Procedures, Anal. Chem., 36,
1627–1639, <ext-link xlink:href="https://doi.org/10.1021/ac60214a047" ext-link-type="DOI">10.1021/ac60214a047</ext-link>, 1964.</mixed-citation></ref>
      <ref id="bib1.bibx64"><?xmltex \def\ref@label{{Seidel et~al.(2019)Seidel, Hutengs, Ludwig, {Thiele-Bruhn}, and
Vohland}}?><label>Seidel et al.(2019)Seidel, Hutengs, Ludwig, Thiele-Bruhn, and
Vohland</label><?label seidelStrategiesEfficientEstimation2019?><mixed-citation>Seidel, M., Hutengs, C., Ludwig, B., Thiele-Bruhn, S., and Vohland, M.:
Strategies for the Efficient Estimation of Soil Organic Carbon at the Field
Scale with Vis-NIR Spectroscopy: Spectral Libraries and Spiking vs.
Local Calibrations, Geoderma, 354, 1–13,
<ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2019.07.014" ext-link-type="DOI">10.1016/j.geoderma.2019.07.014</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx65"><?xmltex \def\ref@label{{Seybold et~al.(2019)Seybold, Ferguson, Wysocki, Bailey, Anderson,
Nester, Schoeneberger, Wills, Libohova, Hoover, and
Thomas}}?><label>Seybold et al.(2019)Seybold, Ferguson, Wysocki, Bailey, Anderson,
Nester, Schoeneberger, Wills, Libohova, Hoover, and
Thomas</label><?label seyboldApplicationMidInfraredSpectroscopy2019?><mixed-citation>Seybold, C. A., Ferguson, R., Wysocki, D., Bailey, S., Anderson, J., Nester,
B., Schoeneberger, P., Wills, S., Libohova, Z., Hoover, D., and Thomas, P.:
Application of Mid-Infrared Spectroscopy in Soil Survey, Soil
Sci. Soc. Am. J., 83, 1746–1759,
<ext-link xlink:href="https://doi.org/10.2136/sssaj2019.06.0205" ext-link-type="DOI">10.2136/sssaj2019.06.0205</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx66"><?xmltex \def\ref@label{{Shenk et~al.(1997)Shenk, Westerhaus, and
Berzaghi}}?><label>Shenk et al.(1997)Shenk, Westerhaus, and
Berzaghi</label><?label shenkInvestigationLOCALCalibration1997?><mixed-citation>Shenk, J. S., Westerhaus, M. O., and Berzaghi, P.: Investigation of a LOCAL
Calibration Procedure for near Infrared Instruments, Journal of Near
Infrared Spectroscopy, 5, 223–232, <ext-link xlink:href="https://doi.org/10.1255/jnirs.115" ext-link-type="DOI">10.1255/jnirs.115</ext-link>, 1997.</mixed-citation></ref>
      <ref id="bib1.bibx67"><?xmltex \def\ref@label{{Shepherd and Walsh(2007)}}?><label>Shepherd and Walsh(2007)</label><?label shepherdInfraredSpectroscopyEnabling2007?><mixed-citation>Shepherd, K. D. and Walsh, M. G.: Infrared
Spectroscopy – Enabling an Evidence-Based Diagnostic
Surveillance Approach to Agricultural and Environmental Management
in Developing Countries, Journal of Near Infrared Spectroscopy, 15,
1–19, <ext-link xlink:href="https://doi.org/10.1255/jnirs.716" ext-link-type="DOI">10.1255/jnirs.716</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bibx68"><?xmltex \def\ref@label{{Shi et~al.(2014)Shi, Wang, Peng, Ji, Liu, Li, and
Viscarra~Rossel}}?><label>Shi et al.(2014)Shi, Wang, Peng, Ji, Liu, Li, and
Viscarra Rossel</label><?label shiDevelopmentNationalVNIR2014?><mixed-citation>Shi, Z., Wang, Q., Peng, J., Ji, W., Liu, H., Li, X., and Viscarra Rossel,
R. A.: Development of a National VNIR Soil-Spectral Library for Soil
Classification and Prediction of Organic Matter Concentrations, Science China
Earth Sciences, 57, 1671–1680, <ext-link xlink:href="https://doi.org/10.1007/s11430-013-4808-x" ext-link-type="DOI">10.1007/s11430-013-4808-x</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bibx69"><?xmltex \def\ref@label{{Shi et~al.(2015)Shi, Ji, Viscarra~Rossel, Chen, and
Zhou}}?><label>Shi et al.(2015)Shi, Ji, Viscarra Rossel, Chen, and
Zhou</label><?label shiPredictionSoilOrganic2015?><mixed-citation>Shi, Z., Ji, W., Viscarra Rossel, R. A., Chen, S., and Zhou, Y.: Prediction of
Soil Organic Matter Using a Spatially Constrained Local Partial Least Squares
Regression and the Chinese Vis-NIR Spectral Library, Europ. J. Soil Sci., 66, 679–687, <ext-link xlink:href="https://doi.org/10.1111/ejss.12272" ext-link-type="DOI">10.1111/ejss.12272</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx70"><?xmltex \def\ref@label{{Sila et~al.(2016)Sila, Shepherd, and
Pokhariyal}}?><label>Sila et al.(2016)Sila, Shepherd, and
Pokhariyal</label><?label silaEvaluatingUtilityMidinfrared2016?><mixed-citation>Sila, A. M., Shepherd, K. D., and Pokhariyal, G. P.: Evaluating the Utility of
Mid-Infrared Spectral Subspaces for Predicting Soil Properties, Chemometrics
and Intelligent Laboratory Systems, 153, 92–105,
<ext-link xlink:href="https://doi.org/10.1016/j.chemolab.2016.02.013" ext-link-type="DOI">10.1016/j.chemolab.2016.02.013</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx71"><?xmltex \def\ref@label{{{Soriano-Disla} et~al.(2014){Soriano-Disla}, Janik, Viscarra~Rossel,
Macdonald, and McLaughlin}}?><label>Soriano-Disla et al.(2014)Soriano-Disla, Janik, Viscarra Rossel,
Macdonald, and McLaughlin</label><?label soriano-dislaPerformanceVisibleMidInfrared2014?><mixed-citation>Soriano-Disla, J. M., Janik, L. J., Viscarra Rossel, R. A., Macdonald, L. M.,
and McLaughlin, M. J.: The Performance of Visible, Near-, and
Mid-Infrared Reflectance Spectroscopy for Prediction of Soil
Physical, Chemical, and Biological Properties, Appl. Spec.  Rev., 49, 139–186, <ext-link xlink:href="https://doi.org/10.1080/05704928.2013.811081" ext-link-type="DOI">10.1080/05704928.2013.811081</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bibx72"><?xmltex \def\ref@label{{Stevens and {Ramirez-Lopez}(2020)}}?><label>Stevens and Ramirez-Lopez(2020)</label><?label R-prospectr?><mixed-citation>
Stevens, A. and Ramirez-Lopez, L.: Prospectr: Miscellaneous Functions for
Processing and Sample Selection of Spectroscopic Data, r package version
0.2.0, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx73"><?xmltex \def\ref@label{{Stevens et~al.(2013)Stevens, Nocita, T{\'{o}}th, Montanarella, and van
Wesemael}}?><label>Stevens et al.(2013)Stevens, Nocita, Tóth, Montanarella, and van
Wesemael</label><?label stevensPredictionSoilOrganic2013a?><mixed-citation>Stevens, A., Nocita, M., Tóth, G., Montanarella, L., and van Wesemael, B.:
Prediction of Soil Organic Carbon at the European Scale by
Visible and Near InfraRed Reflectance Spectroscopy, PLOS ONE, 8,
1–13, <ext-link xlink:href="https://doi.org/10.1371/journal.pone.0066409" ext-link-type="DOI">10.1371/journal.pone.0066409</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bibx74"><?xmltex \def\ref@label{{Summerauer(2017)}}?><label>Summerauer(2017)</label><?label summerauerSustainableAgriculturalIntensification2017?><mixed-citation>
Summerauer, L.: Sustainable Agricultural Intensification Methods of
Cassava Based Systems for Improving Livelihoods and Forest
Conservation in the Congo Basin, Master thesis, ETH Zurich, Zurich,
Switzerland, 60 pp., 2017.</mixed-citation></ref>
      <ref id="bib1.bibx75"><?xmltex \def\ref@label{{Summerauer(2020)}}?><label>Summerauer(2020)</label><?label summerauer2020?><mixed-citation>Summerauer, L.: laura-summerauer/ssl-central-africa: Codes and data for manuscript submission (submission version) (v.1.0), Zenodo [code], <ext-link xlink:href="https://doi.org/10.5281/zenodo.4351254" ext-link-type="DOI">10.5281/zenodo.4351254</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx76"><?xmltex \def\ref@label{{Tsakiridis et~al.(2019)Tsakiridis, Theocharis, Panagos, and
Zalidis}}?><label>Tsakiridis et al.(2019)Tsakiridis, Theocharis, Panagos, and
Zalidis</label><?label tsakiridisEvolutionaryFuzzyRulebased2019?><mixed-citation>Tsakiridis, N. L., Theocharis, J. B., Panagos, P., and Zalidis, G. C.: An
Evolutionary Fuzzy Rule-Based System Applied to the Prediction of Soil
Organic Carbon from Soil Spectral Libraries, Applied Soft Computing, 81,
1–18, <ext-link xlink:href="https://doi.org/10.1016/j.asoc.2019.105504" ext-link-type="DOI">10.1016/j.asoc.2019.105504</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx77"><?xmltex \def\ref@label{{Tyukavina et~al.(2018)Tyukavina, Hansen, Potapov, Parker, Okpa,
Stehman, Kommareddy, and Turubanova}}?><label>Tyukavina et al.(2018)Tyukavina, Hansen, Potapov, Parker, Okpa,
Stehman, Kommareddy, and Turubanova</label><?label tyukavinaCongoBasinForest2018?><mixed-citation>Tyukavina, A., Hansen, M. C., Potapov, P., Parker, D., Okpa, C., Stehman,
S. V., Kommareddy, I., and Turubanova, S.: Congo Basin Forest Loss
Dominated by Increasing Smallholder Clearing, Sci. Adv., 4, 1–12,
<ext-link xlink:href="https://doi.org/10.1126/sciadv.aat2993" ext-link-type="DOI">10.1126/sciadv.aat2993</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx78"><?xmltex \def\ref@label{{Tziolas et~al.(2019)Tziolas, Tsakiridis, {Ben-Dor}, Theocharis, and
Zalidis}}?><label>Tziolas et al.(2019)Tziolas, Tsakiridis, Ben-Dor, Theocharis, and
Zalidis</label><?label tziolasMemorybasedLearningApproach2019?><mixed-citation>Tziolas, N., Tsakiridis, N., Ben-Dor, E., Theocharis, J., and Zalidis, G.: A
Memory-Based Learning Approach Utilizing Combined Spectral Sources and
Geographical Proximity for Improved VIS-NIR-SWIR Soil Properties
Estimation, Geoderma, 340, 11–24, <ext-link xlink:href="https://doi.org/10.1016/j.geoderma.2018.12.044" ext-link-type="DOI">10.1016/j.geoderma.2018.12.044</ext-link>,
2019.</mixed-citation></ref>
      <ref id="bib1.bibx79"><?xmltex \def\ref@label{{V{\aa}gen et~al.(2020)V{\aa}gen, Winowiecki, Desta, Tondoh, Weullow,
Shepherd, and Sila}}?><label>Vågen et al.(2020)Vågen, Winowiecki, Desta, Tondoh, Weullow,
Shepherd, and Sila</label><?label vagenMidInfraredSpectraMIRS2020?><mixed-citation>Vågen, T.-G., Winowiecki, L. A., Desta, L., Tondoh, E. J., Weullow, E.,
Shepherd, K., and Sila, A.: Mid-Infrared Spectra (MIRS) from ICRAF
Soil and Plant Spectroscopy Laboratory: Africa Soil Information
Service (AfSIS) Phase I 2009-2013, World Agroforestry – Research
Data Repository, V1,  <ext-link xlink:href="https://doi.org/10.34725/DVN/QXCWP1" ext-link-type="DOI">10.34725/DVN/QXCWP1</ext-link>,
2020.</mixed-citation></ref>
      <ref id="bib1.bibx80"><?xmltex \def\ref@label{{Van~Ranst et~al.(2010)Van~Ranst, Verdoodt, and
Baert}}?><label>Van Ranst et al.(2010)Van Ranst, Verdoodt, and
Baert</label><?label vanranstSoilMappingAfrica2010?><mixed-citation>Van Ranst, E., Verdoodt, A., and Baert, G.: Soil Mapping in Africa at
the Crossroads: Work to Make up for Lost Ground, Meded. Zitt.
K. Acad. overzeese Wet, 56, 147–163, 2010.
 </mixed-citation></ref><?xmltex \hack{\newpage}?>
      <ref id="bib1.bibx81"><?xmltex \def\ref@label{{Veldkamp et~al.(2020)Veldkamp, Schmidt, Powers, and
Corre}}?><label>Veldkamp et al.(2020)Veldkamp, Schmidt, Powers, and
Corre</label><?label veldkampDeforestationReforestationImpacts2020?><mixed-citation>Veldkamp, E., Schmidt, M., Powers, J. S., and Corre, M. D.: Deforestation and
Reforestation Impacts on Soils in the Tropics, Nat. Rev. Earth   Environ., 1, 590–605, <ext-link xlink:href="https://doi.org/10.1038/s43017-020-0091-5" ext-link-type="DOI">10.1038/s43017-020-0091-5</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx82"><?xmltex \def\ref@label{{Viscarra~Rossel and
Brus(2018)}}?><label>Viscarra Rossel and
Brus(2018)</label><?label viscarrarosselCostefficiencyReliabilityTwo2018?><mixed-citation>Viscarra Rossel, R. A. and Brus, D. J.: The Cost-Efficiency and Reliability of
Two Methods for Soil Organic C Accounting: The Cost-Efficiency and
Reliability of Two Methods for Soil Organic C Accounting, Land
Degradation &amp; Development, 29, 506–520, <ext-link xlink:href="https://doi.org/10.1002/ldr.2887" ext-link-type="DOI">10.1002/ldr.2887</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bibx83"><?xmltex \def\ref@label{{Viscarra~Rossel et~al.(2016)Viscarra~Rossel, Behrens, {Ben-Dor},
Brown, Dematt{\^{e}}, Shepherd, Shi, Stenberg, Stevens, Adamchuk, A{\"{i}}chi,
Barth{\`{e}}s, Bartholomeus, Bayer, Bernoux, B{\"{o}}ttcher, Brodsk{\'{y}}, Du,
Chappell, Fouad, Genot, Gomez, Grunwald, Gubler, Guerrero, Hedley, Knadel,
Morr{\'{a}}s, Nocita, {Ramirez-Lopez}, Roudier, Campos, Sanborn, Sellitto,
Sudduth, Rawlins, Walter, Winowiecki, Hong, and
Ji}}?><label>Viscarra Rossel et al.(2016)Viscarra Rossel, Behrens, Ben-Dor,
Brown, Demattê, Shepherd, Shi, Stenberg, Stevens, Adamchuk, Aïchi,
Barthès, Bartholomeus, Bayer, Bernoux, Böttcher, Brodský, Du,
Chappell, Fouad, Genot, Gomez, Grunwald, Gubler, Guerrero, Hedley, Knadel,
Morrás, Nocita, Ramirez-Lopez, Roudier, Campos, Sanborn, Sellitto,
Sudduth, Rawlins, Walter, Winowiecki, Hong, and
Ji</label><?label viscarrarosselGlobalSpectralLibrary2016?><mixed-citation>Viscarra Rossel, R. A., Behrens, T., Ben-Dor, E., Brown, D. J., Demattê,
J. A. M., Shepherd, K. D., Shi, Z., Stenberg, B., Stevens, A., Adamchuk, V.,
Aïchi, H., Barthès, B. G., Bartholomeus, H. M., Bayer, A. D.,
Bernoux, M., Böttcher, K., Brodský, L., Du, C. W., Chappell, A.,
Fouad, Y., Genot, V., Gomez, C., Grunwald, S., Gubler, A., Guerrero, C.,
Hedley, C. B., Knadel, M., Morrás, H. J. M., Nocita, M., Ramirez-Lopez,
L., Roudier, P., Campos, E. M. R., Sanborn, P., Sellitto, V. M., Sudduth,
K. A., Rawlins, B. G., Walter, C., Winowiecki, L. A., Hong, S. Y., and Ji,
W.: A Global Spectral Library to Characterize the World's Soil, Earth-Sci.   Rev., 155, 198–230, <ext-link xlink:href="https://doi.org/10.1016/j.earscirev.2016.01.012" ext-link-type="DOI">10.1016/j.earscirev.2016.01.012</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx84"><?xmltex \def\ref@label{{Vohland et~al.(2016)Vohland, Harbich, Ludwig, Emmerling, and
{Thiele-Bruhn}}}?><label>Vohland et al.(2016)Vohland, Harbich, Ludwig, Emmerling, and
Thiele-Bruhn</label><?label vohlandQuantificationSoilVariables2016?><mixed-citation>Vohland, M., Harbich, M., Ludwig, M., Emmerling, C., and Thiele-Bruhn, S.:
Quantification of Soil Variables in a Heterogeneous Soil Region With
VIS-NIR-SWIR Data Using Different Statistical
Sampling and Modeling Strategies, IEEE Journal of Selected Topics in
Applied Earth Observations and Remote Sensing, 9, 4011–4021,
<ext-link xlink:href="https://doi.org/10.1109/JSTARS.2016.2572879" ext-link-type="DOI">10.1109/JSTARS.2016.2572879</ext-link>, 2016.
</mixed-citation></ref><?xmltex \hack{\newpage}?>
      <ref id="bib1.bibx85"><?xmltex \def\ref@label{{Vollset et~al.(2020)Vollset, Goren, Yuan, Cao, Smith, Hsiao,
Bisignano, Azhar, Castro, Chalek, Dolgert, Frank, Fukutaki, Hay, Lozano,
Mokdad, Nandakumar, Pierce, Pletcher, Robalik, Steuben, Wunrow, Zlavog, and
Murray}}?><label>Vollset et al.(2020)Vollset, Goren, Yuan, Cao, Smith, Hsiao,
Bisignano, Azhar, Castro, Chalek, Dolgert, Frank, Fukutaki, Hay, Lozano,
Mokdad, Nandakumar, Pierce, Pletcher, Robalik, Steuben, Wunrow, Zlavog, and
Murray</label><?label vollsetFertilityMortalityMigration2020?><mixed-citation>Vollset, S. E., Goren, E., Yuan, C.-W., Cao, J., Smith, A. E., Hsiao, T.,
Bisignano, C., Azhar, G. S., Castro, E., Chalek, J., Dolgert, A. J., Frank,
T., Fukutaki, K., Hay, S. I., Lozano, R., Mokdad, A. H., Nandakumar, V.,
Pierce, M., Pletcher, M., Robalik, T., Steuben, K. M., Wunrow, H. Y., Zlavog,
B. S., and Murray, C. J. L.: Fertility, Mortality, Migration, and Population
Scenarios for 195 Countries and Territories from 2017 to 2100: A Forecasting
Analysis for the Global Burden of Disease Study, The Lancet, 396,
1–22, <ext-link xlink:href="https://doi.org/10.1016/S0140-6736(20)30677-2" ext-link-type="DOI">10.1016/S0140-6736(20)30677-2</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx86"><?xmltex \def\ref@label{{Wetterlind and
Stenberg(2010)}}?><label>Wetterlind and
Stenberg(2010)</label><?label wetterlindNearinfraredSpectroscopyWithinfield2010?><mixed-citation>Wetterlind, J. and Stenberg, B.: Near-Infrared Spectroscopy for within-Field
Soil Characterization: Small Local Calibrations Compared with National
Libraries Spiked with Local Samples, Europ. J. Soil Sci., 61,
823–843, <ext-link xlink:href="https://doi.org/10.1111/j.1365-2389.2010.01283.x" ext-link-type="DOI">10.1111/j.1365-2389.2010.01283.x</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bibx87"><?xmltex \def\ref@label{{Wise and Gallagher(1996)}}?><label>Wise and Gallagher(1996)</label><?label wiseProcessChemometricsApproach1996?><mixed-citation>Wise, B. M. and Gallagher, N. B.: The Process Chemometrics Approach to Process
Monitoring and Fault Detection, Journal of Process Control, 6, 329–348,
<ext-link xlink:href="https://doi.org/10.1016/0959-1524(96)00009-1" ext-link-type="DOI">10.1016/0959-1524(96)00009-1</ext-link>, 1996.</mixed-citation></ref>
      <ref id="bib1.bibx88"><?xmltex \def\ref@label{{Wise and Roginski(2015)}}?><label>Wise and Roginski(2015)</label><?label wiseCalibrationModelMaintenance2015?><mixed-citation>Wise, B. M. and Roginski, R. T.: A Calibration Model Maintenance Roadmap,
IFAC-PapersOnLine, 48, 260–265, <ext-link xlink:href="https://doi.org/10.1016/j.ifacol.2015.08.191" ext-link-type="DOI">10.1016/j.ifacol.2015.08.191</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx89"><?xmltex \def\ref@label{{Wold et~al.(1984)Wold, Ruhe, Wold, and
Dunn}}?><label>Wold et al.(1984)Wold, Ruhe, Wold, and
Dunn</label><?label woldCollinearityProblemLinear1984?><mixed-citation>Wold, S., Ruhe, A., Wold, H., and Dunn, III, W. J.: The Collinearity
Problem, in: Linear Regression, The Partial Least Squares (PLS)
Approach to Generalized Inverses, SIAM Journal on Scientific and
Statistical Computing, 5, 735–743, <ext-link xlink:href="https://doi.org/10.1137/0905052" ext-link-type="DOI">10.1137/0905052</ext-link>, 1984.</mixed-citation></ref>
      <ref id="bib1.bibx90"><?xmltex \def\ref@label{{Wold et~al.(2001)Wold, Trygg, Berglund, and
Antti}}?><label>Wold et al.(2001)Wold, Trygg, Berglund, and
Antti</label><?label woldRecentDevelopmentsPLS2001?><mixed-citation>Wold, S., Trygg, J., Berglund, A., and Antti, H.: Some Recent Developments in
PLS Modeling, Chemometrics and Intelligent Laboratory Systems, 58,
131–150, <ext-link xlink:href="https://doi.org/10.1016/S0169-7439(01)00156-3" ext-link-type="DOI">10.1016/S0169-7439(01)00156-3</ext-link>, 2001.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>The central African soil spectral library: a new soil infrared repository and a geographical prediction analysis</article-title-html>
<abstract-html><p>Information on soil properties is crucial for soil preservation, the improvement of food security, and the provision of ecosystem services. In particular, for the African continent, spatially explicit information on soils and their ability to sustain these services is still scarce. To address data gaps, infrared spectroscopy has achieved great success as a cost-effective solution to quantify soil properties in recent decades. Here, we present a mid-infrared soil spectral library (SSL) for central Africa (CSSL) that can predict key soil properties, allowing for future soil estimates with a minimal need for expensive and time-consuming  wet chemistry. Currently, our CSSL contains over 1800 soil samples from 10 distinct geoclimatic regions throughout the Congo Basin and along the Albertine Rift. For the analysis, we selected six regions from the CSSL, for which we built predictive models for total carbon (TC) and total nitrogen (TN) using an existing continental SSL (African Soil Information Service, AfSIS SSL; <i>n</i> = 1902) that does not include central African soils. Using memory-based learning (MBL), we explored three different strategies at decreasing degrees of geographic extrapolation, using models built with (1) the AfSIS SSL only, (2) AfSIS SSL combined with the five remaining central African regions, and (3) a combination of AfSIS SSL, the remaining five regions, and selected samples from the target region (spiking). For this last strategy we introduce a method for spiking MBL models. We found that when using the AfSIS SSL only to predict the six central African regions, the root mean square error of the predictions (RMSE<sub>pred</sub>) was between 3.85–8.74 and 0.40–1.66&thinsp;g kg<sup>−1</sup> for TC and TN, respectively. The ratio of performance to the interquartile distance (RPIQ<sub>pred</sub>) ranged between 0.96–3.95 for TC and 0.59–2.86 for TN. While the effect of the second strategy compared to the first strategy was mixed, the third strategy, spiking with samples from the target regions, could clearly reduce the RMSE<sub>pred</sub> to 3.19–7.32&thinsp;g kg<sup>−1</sup> for TC and 0.24–0.89&thinsp;g kg<sup>−1</sup> for TN. RPIQ<sub>pred</sub> values were increased to ranges of 1.43–5.48 and 1.62–4.45 for TC and TN, respectively. In general, predicted TC and TN for soils of each of the six regions were accurate; the effect of spiking and avoiding geographical extrapolation was noticeably large. We conclude that our CSSL adds valuable soil diversity that can improve predictions for the Congo Basin region compared to using the continental AfSIS SSL alone; thus, analyses of other soils in central Africa will be able to profit from a more diverse spectral feature space. Given these promising results, the library comprises an important tool to facilitate economical soil analyses and predict soil properties in an understudied yet critical region of Africa. Our SSL is openly available for application and for enlargement with more spectral and reference data to further improve soil diagnostic accuracy and cost-effectiveness.</p></abstract-html>
<ref-html id="bib1.bib1"><label>Angelopoulou et al.(2020)Angelopoulou, Balafoutis, Zalidis, and
Bochtis</label><mixed-citation>
Angelopoulou, T., Balafoutis, A., Zalidis, G., and Bochtis, D.: From
Laboratory to Proximal Sensing Spectroscopy for Soil Organic Carbon
Estimation – A Review, Sustainability, 12, 1–24,
<a href="https://doi.org/10.3390/su12020443" target="_blank">https://doi.org/10.3390/su12020443</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>Baert(1995)</label><mixed-citation>
Baert, G.: Properties and Chemical Management Aspects of Soils on Different
Parent Rocks in the Lower Zaire, Doctoral thesis, Ghent University,
Ghent, Belgium, 1995.
</mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>Baert et al.(2009)Baert, Van Ranst, Ngongo, Kasongo, Verdoodt,
Mujinya, and Mukalay</label><mixed-citation>
Baert, G., Van Ranst, E., Ngongo, M., Kasongo, E., Verdoodt, A., Mujinya, B.,
and Mukalay, J.: Guide Des Sols En R.D. Congo. Tome II:
Description et Données Physico-Chimiques de Profils Types.,
Imprimé par l'Ecole Technique Salama, Lubumbashi, R.D. Congo, 2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>Baert et al.(2013)Baert, Van Ranst, Ngongo, and
Verdoodt</label><mixed-citation>
Baert, G., Van Ranst, E., Ngongo, M., and Verdoodt, A.: Soil Survey in DR
Congo  –  from 1935 until Today, Meded. Zitt. K. Acad. overzeese
Wet, 59, 345–362, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>Ballabio and
Consonni(2013)</label><mixed-citation>
Ballabio, D. and Consonni, V.: Classification Tools in Chemistry. Part 1:
Linear Models, PLS-DA, Analytical Methods, 5, 3790–3798,
<a href="https://doi.org/10.1039/c3ay40582f" target="_blank">https://doi.org/10.1039/c3ay40582f</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>Barthès et al.(2020)Barthès, Kouakoua, Coll, Clairotte,
Moulin, Saby, Le Cadre, Etayo, and
Chevallier</label><mixed-citation>
Barthès, B. G., Kouakoua, E., Coll, P., Clairotte, M., Moulin, P., Saby,
N. P., Le Cadre, E., Etayo, A., and Chevallier, T.: Improvement in Spectral
Library-Based Quantification of Soil Properties Using Representative Spiking
and Local Calibration  –  The Case of Soil Inorganic Carbon
Prediction by Mid-Infrared Spectroscopy, Geoderma, 369, 114272,
<a href="https://doi.org/10.1016/j.geoderma.2020.114272" target="_blank">https://doi.org/10.1016/j.geoderma.2020.114272</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>Baumann(2020)</label><mixed-citation>
Baumann, P.: Simplerspec: Soil and Plant Spectroscopic Model Building and
Prediction, r package version 0.1.0.9001, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>Baumgartner et al.(2020)Baumgartner, Barthel, Drake, Bauters,
Makelele, Mugula, Summerauer, Gallarotti, Cizungu Ntaboba, Van Oost, Boeckx,
Doetterl, Werner, and Six</label><mixed-citation>
Baumgartner, S., Barthel, M., Drake, T. W., Bauters, M., Makelele, I. A., Mugula, J. K., Summerauer, L., Gallarotti, N., Cizungu Ntaboba, L., Van Oost, K., Boeckx, P., Doetterl, S., Werner, R. A., and Six, J.: Seasonality, drivers, and isotopic composition of soil CO<sub>2</sub> fluxes from tropical forests of the Congo Basin, Biogeosciences, 17, 6207–6218, <a href="https://doi.org/10.5194/bg-17-6207-2020" target="_blank">https://doi.org/10.5194/bg-17-6207-2020</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>Bauters et al.(2015)Bauters, Ampoorter, Huygens, Kearsley,
De Haulleville, Sellan, Verbeeck, Boeckx, and
Verheyen</label><mixed-citation>
Bauters, M., Ampoorter, E., Huygens, D., Kearsley, E., De Haulleville, T.,
Sellan, G., Verbeeck, H., Boeckx, P., and Verheyen, K.: Functional Identity
Explains Carbon Sequestration in a 77-Year-Old Experimental Tropical
Plantation, Ecosphere, 6, 198, <a href="https://doi.org/10.1890/ES15-00342.1" target="_blank">https://doi.org/10.1890/ES15-00342.1</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>Bauters et al.(2017)Bauters, Verbeeck, Doetterl, Ampoorter, Baert,
Vermeir, Verheyen, and Boeckx</label><mixed-citation>
Bauters, M., Verbeeck, H., Doetterl, S., Ampoorter, E., Baert, G., Vermeir, P.,
Verheyen, K., and Boeckx, P.: Functional Composition of Tree
Communities Changed Topsoil Properties in an Old Experimental Tropical
Plantation, Ecosystems, 20, 861–871, <a href="https://doi.org/10.1007/s10021-016-0081-0" target="_blank">https://doi.org/10.1007/s10021-016-0081-0</a>,
2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>Bauters et al.(2019a)Bauters, Verbeeck, Rütting,
Barthel, Bazirake Mujinya, Bamba, Bodé, Boyemba, Bulonza, Carlsson,
Eriksson, Makelele, Six, Cizungu Ntaboba, and
Boeckx</label><mixed-citation>
Bauters, M., Verbeeck, H., Rütting, T., Barthel, M., Bazirake Mujinya, B.,
Bamba, F., Bodé, S., Boyemba, F., Bulonza, E., Carlsson, E., Eriksson,
L., Makelele, I., Six, J., Cizungu Ntaboba, L., and Boeckx, P.: Contrasting
Nitrogen Fluxes in African Tropical Forests of the Congo Basin,
Ecological Monographs, 89, 1–17, <a href="https://doi.org/10.1002/ecm.1342" target="_blank">https://doi.org/10.1002/ecm.1342</a>, 2019a.
</mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>Bauters et al.(2019b)Bauters, Vercleyen, Vanlauwe, Six,
Bonyoma, Badjoko, Hubau, Hoyt, Boudin, Verbeeck, and
Boeckx</label><mixed-citation>
Bauters, M., Vercleyen, O., Vanlauwe, B., Six, J., Bonyoma, B., Badjoko, H.,
Hubau, W., Hoyt, A., Boudin, M., Verbeeck, H., and Boeckx, P.: Long-term
Recovery of the Functional Community Assembly and Carbon Pools in an
African Tropical Forest Succession, Biotropica, 51, 319–329,
<a href="https://doi.org/10.1111/btp.12647" target="_blank">https://doi.org/10.1111/btp.12647</a>, 2019b.
</mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>Bauters et al.(2021)Bauters, Moonen, Summerauer, Doetterl, Wasner,
Griepentrog, Mumbanza, Kearsley, Ewango, Boyemba, Six, Muys, Verbist, Boeckx,
and Verheyen</label><mixed-citation>
Bauters, M., Moonen, P., Summerauer, L., Doetterl, S., Wasner, D., Griepentrog,
M., Mumbanza, F. M., Kearsley, E., Ewango, C., Boyemba, F., Six, J., Muys,
B., Verbist, B., Boeckx, P., and Verheyen, K.: Soil Nutrient Depletion
and Tree Functional Composition Shift Following Repeated Clearing in
Secondary Forests of the Congo Basin, Ecosystems, 24, 1422–1435,
<a href="https://doi.org/10.1007/s10021-020-00593-6" target="_blank">https://doi.org/10.1007/s10021-020-00593-6</a>, 2021.
</mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>Beck et al.(2018)Beck, Zimmermann, McVicar, Vergopolan, Berg, and
Wood</label><mixed-citation>
Beck, H. E., Zimmermann, N. E., McVicar, T. R., Vergopolan, N., Berg, A., and
Wood, E. F.: Present and Future Köppen-Geiger Climate
Classification Maps at 1-Km Resolution, Sci. Data, 5, 1–12,
<a href="https://doi.org/10.1038/sdata.2018.214" target="_blank">https://doi.org/10.1038/sdata.2018.214</a>, 2018.
</mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>Bellon-Maurel et al.(2010)Bellon-Maurel, Fernandez-Ahumada,
Palagos, Roger, and McBratney</label><mixed-citation>
Bellon-Maurel, V., Fernandez-Ahumada, E., Palagos, B., Roger, J.-M., and
McBratney, A.: Critical Review of Chemometric Indicators Commonly Used for
Assessing the Quality of the Prediction of Soil Attributes by NIR
Spectroscopy, TrAC Trends in Analytical Chemistry, 29, 1073–1081,
<a href="https://doi.org/10.1016/j.trac.2010.05.006" target="_blank">https://doi.org/10.1016/j.trac.2010.05.006</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>Birgé et al.(2016)Birgé, Bevans, Allen, Angeler, Baer, and
Wall</label><mixed-citation>
Birgé, H. E., Bevans, R. A., Allen, C. R., Angeler, D. G., Baer, S. G., and
Wall, D. H.: Adaptive Management for Soil Ecosystem Services, J. Environ. Manage., 183, 371–378, <a href="https://doi.org/10.1016/j.jenvman.2016.06.024" target="_blank">https://doi.org/10.1016/j.jenvman.2016.06.024</a>,
2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>Briedis et al.(2020)Briedis, Baldock, de Moraes Sá, dos
Santos, and Milori</label><mixed-citation>
Briedis, C., Baldock, J., de Moraes Sá, J. C., dos Santos, J. B., and
Milori, D. M. B. P.: Strategies to Improve the Prediction of Bulk Soil and
Fraction Organic Carbon in Brazilian Samples by Using an Australian
National Mid-Infrared Spectral Library, Geoderma, 373, 1–13,
<a href="https://doi.org/10.1016/j.geoderma.2020.114401" target="_blank">https://doi.org/10.1016/j.geoderma.2020.114401</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>Clairotte et al.(2016)Clairotte, Grinand, Kouakoua, Thébault,
Saby, Bernoux, and Barthès</label><mixed-citation>
Clairotte, M., Grinand, C., Kouakoua, E., Thébault, A., Saby, N. P.,
Bernoux, M., and Barthès, B. G.: National Calibration of Soil Organic
Carbon Concentration Using Diffuse Infrared Reflectance Spectroscopy,
Geoderma, 276, 41–52, <a href="https://doi.org/10.1016/j.geoderma.2016.04.021" target="_blank">https://doi.org/10.1016/j.geoderma.2016.04.021</a>, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>Cox et al.(2013)Cox, Pearson, Booth, Friedlingstein, Huntingford,
Jones, and Luke</label><mixed-citation>
Cox, P. M., Pearson, D., Booth, B. B., Friedlingstein, P., Huntingford, C.,
Jones, C. D., and Luke, C. M.: Sensitivity of Tropical Carbon to Climate
Change Constrained by Carbon Dioxide Variability, Nature, 494, 341–344,
<a href="https://doi.org/10.1038/nature11882" target="_blank">https://doi.org/10.1038/nature11882</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>Curtis et al.(2018)Curtis, Slay, Harris, Tyukavina, and
Hansen</label><mixed-citation>
Curtis, P. G., Slay, C. M., Harris, N. L., Tyukavina, A., and Hansen, M. C.:
Classifying Drivers of Global Forest Loss, Science, 361, 1108–1111,
<a href="https://doi.org/10.1126/science.aau3445" target="_blank">https://doi.org/10.1126/science.aau3445</a>, 2018.
</mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>Dangal et al.(2019)Dangal, Sanderman, Wills, and
Ramirez-Lopez</label><mixed-citation>
Dangal, S., Sanderman, J., Wills, S., and Ramirez-Lopez, L.: Accurate and
Precise Prediction of Soil Properties from a Large Mid-Infrared
Spectral Library, Soil Systems, 3, 1–23, <a href="https://doi.org/10.3390/soilsystems3010011" target="_blank">https://doi.org/10.3390/soilsystems3010011</a>,
2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>Demattê et al.(2019)Demattê, Dotto, Paiva, Sato, Dalmolin,
de Araújo, da Silva, Nanni, ten Caten, Noronha, Lacerda, de
Araújo Filho, Rizzo, Bellinaso, Francelino, Schaefer, Vicente, dos
Santos, de Sá Barretto Sampaio, Menezes, de Souza, Abrahão,
Coelho, Grego, Lani, Fernandes, Gonçalves, Silva, de Menezes, Curi,
Couto, dos Anjos, Ceddia, Pinheiro, Grunwald, Vasques, Marques Júnior,
da Silva, Barreto, Nóbrega, da Silva, de Souza, Valladares, Viana,
da Silva Terra, Horák-Terra, Fiorio, da Silva, Frade Júnior,
Lima, Alba, de Souza Junior, Brefin, Ruivo, Ferreira, Brait, Caetano,
Bringhenti, de Sousa Mendes, Safanelli, Guimarães, Poppiel, e Souza,
Quesada, and do Couto</label><mixed-citation>
Demattê, J. A. M., Dotto, A. C., Paiva, A. F. S., Sato, M. V., Dalmolin, R.
S. D., de Araújo, M. d. S. B., da Silva, E. B., Nanni, M. R., ten
Caten, A., Noronha, N. C., Lacerda, M. P. C., de Araújo Filho, J. C.,
Rizzo, R., Bellinaso, H., Francelino, M. R., Schaefer, C. E. G. R., Vicente,
L. E., dos Santos, U. J., de Sá Barretto Sampaio, E. V., Menezes, R.
S. C., de Souza, J. J. L. L., Abrahão, W. A. P., Coelho, R. M., Grego,
C. R., Lani, J. L., Fernandes, A. R., Gonçalves, D. A. M., Silva, S.
H. G., de Menezes, M. D., Curi, N., Couto, E. G., dos Anjos, L. H. C.,
Ceddia, M. B., Pinheiro, É. F. M., Grunwald, S., Vasques, G. M.,
Marques Júnior, J., da Silva, A. J., Barreto, M. C. d. V., Nóbrega,
G. N., da Silva, M. Z., de Souza, S. F., Valladares, G. S., Viana, J.
H. M., da Silva Terra, F., Horák-Terra, I., Fiorio, P. R., da
Silva, R. C., Frade Júnior, E. F., Lima, R. H. C., Alba, J. M. F., de
Souza Junior, V. S., Brefin, M. D. L. M. S., Ruivo, M. D. L. P., Ferreira,
T. O., Brait, M. A., Caetano, N. R., Bringhenti, I., de Sousa Mendes, W.,
Safanelli, J. L., Guimarães, C. C. B., Poppiel, R. R., e Souza, A. B.,
Quesada, C. A., and do Couto, H. T. Z.: The Brazilian Soil Spectral
Library (BSSL): A General View, Application and Challenges,
Geoderma, 354, 1–21, <a href="https://doi.org/10.1016/j.geoderma.2019.05.043" target="_blank">https://doi.org/10.1016/j.geoderma.2019.05.043</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>Doetterl et al.(2021)Doetterl, Asifiwe, Baert, Bamba, Bauters,
Boeckx, Bukombe, Cadisch, Cizungu, Cooper, Hoyt, Kabaseke, Kalbitz, Kidinda,
Maier, Mainka, Mayrock, Muhindo, Mujinya, Mukotanyi, Nabahungu, Reichenbach,
Rewald, Six, Stegmann, Summerauer, Unseld, Vanlauwe, Van Oost, Verheyen,
Vogel, Wilken, and Fiener</label><mixed-citation>
Doetterl, S., Asifiwe, R. K., Baert, G., Bamba, F., Bauters, M., Boeckx, P., Bukombe, B., Cadisch, G., Cooper, M., Cizungu, L. N., Hoyt, A., Kabaseke, C., Kalbitz, K., Kidinda, L., Maier, A., Mainka, M., Mayrock, J., Muhindo, D., Mujinya, B. B., Mukotanyi, S. M., Nabahungu, L., Reichenbach, M., Rewald, B., Six, J., Stegmann, A., Summerauer, L., Unseld, R., Vanlauwe, B., Van Oost, K., Verheyen, K., Vogel, C., Wilken, F., and Fiener, P.: Organic matter cycling along geochemical, geomorphic, and disturbance gradients in forest and cropland of the African Tropics – project TropSOC database version 1.0, Earth Syst. Sci. Data, 13, 4133–4153, <a href="https://doi.org/10.5194/essd-13-4133-2021" target="_blank">https://doi.org/10.5194/essd-13-4133-2021</a>, 2021.
</mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>Don et al.(2011)Don, Schumacher, and
Freibauer</label><mixed-citation>
Don, A., Schumacher, J., and Freibauer, A.: Impact of Tropical Land-Use Change
on Soil Organic Carbon Stocks – a Meta-Analysis: SOIL ORGANIC CARBON AND
LAND-USE CHANGE, Global Change Biol., 17, 1658–1670,
<a href="https://doi.org/10.1111/j.1365-2486.2010.02336.x" target="_blank">https://doi.org/10.1111/j.1365-2486.2010.02336.x</a>, 2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>Fick and Hijmans(2017)</label><mixed-citation>
Fick, S. E. and Hijmans, R. J.: WorldClim 2: New 1-km Spatial Resolution
Climate Surfaces for Global Land Areas, Int.  J. Clim.,
37, 4302–4315, <a href="https://doi.org/10.1002/joc.5086" target="_blank">https://doi.org/10.1002/joc.5086</a>, 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>Fortin et al.(2016)Fortin, Dale, and
Ver Hoef</label><mixed-citation>
Fortin, M.-J., Dale, M. R., and Ver Hoef, J. M.: Spatial Analysis in
Ecology, in: Wiley StatsRef: Statistics Reference Online, edited
by: Balakrishnan, N., Colton, T., Everitt, B., Piegorsch, W., Ruggeri, F., and
Teugels, J. L., John Wiley &amp; Sons, Ltd, Chichester, UK, 13 pp., 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>Gallarotti et al.(2021)Gallarotti, Barthel, Verhoeven, Pereira,
Bauters, Baumgartner, Drake, Boeckx, Mohn, Longepierre, Mugula, Makelele,
Ntaboba, and Six</label><mixed-citation>
Gallarotti, N., Barthel, M., Verhoeven, E., Pereira, E. I. P., Bauters, M.,
Baumgartner, S., Drake, T. W., Boeckx, P., Mohn, J., Longepierre, M., Mugula,
J. K., Makelele, I. A., Ntaboba, L. C., and Six, J.: In-Depth Analysis of
N2O Fluxes in Tropical Forest Soils of the Congo Basin Combining
Isotope and Functional Gene Analysis, International Society for Microbial
Ecology Journal, ISME J., <a href="https://doi.org/10.1038/s41396-021-01004-x" target="_blank">https://doi.org/10.1038/s41396-021-01004-x</a>, 2021.
</mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>Gomez et al.(2020)Gomez, Chevallier, Moulin, Bouferra, Hmaidi,
Arrouays, Jolivet, and Barthès</label><mixed-citation>
Gomez, C., Chevallier, T., Moulin, P., Bouferra, I., Hmaidi, K., Arrouays, D.,
Jolivet, C., and Barthès, B. G.: Prediction of Soil Organic and Inorganic
Carbon Concentrations in Tunisian Samples by Mid-Infrared Reflectance
Spectroscopy Using a French National Library, Geoderma, 375, 1–14,
<a href="https://doi.org/10.1016/j.geoderma.2020.114469" target="_blank">https://doi.org/10.1016/j.geoderma.2020.114469</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>Goyens et al.(2007)Goyens, Verdoodt, Van De Wauw, Baert, Van Engelen,
Dijkshoorn, and Van Ranst</label><mixed-citation>
Goyens, C., Verdoodt, A., Van De Wauw, J., Baert, G., Van Engelen, V.,
Dijkshoorn, J., and Van Ranst, E.: Base de Données Numériques sur les
SOls et le TERrain (SOTER) de l'Afrique Centrale (RD Congo, Rwanda et
Burundi), Etude et Gestion des Sols, 14, 207–218, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>Guerrero et al.(2010)Guerrero, Zornoza, Gómez, and
Mataix-Beneyto</label><mixed-citation>
Guerrero, C., Zornoza, R., Gómez, I., and Mataix-Beneyto, J.: Spiking of
NIR Regional Models Using Samples from Target Sites: Effect of Model
Size on Prediction Accuracy, Geoderma, 158, 66–77,
<a href="https://doi.org/10.1016/j.geoderma.2009.12.021" target="_blank">https://doi.org/10.1016/j.geoderma.2009.12.021</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>Guerrero et al.(2014)Guerrero, Stenberg, Wetterlind, Viscarra Rossel,
Maestre, Mouazen, Zornoza, Ruiz-Sinoga, and
Kuang</label><mixed-citation>
Guerrero, C., Stenberg, B., Wetterlind, J., Viscarra Rossel, R. A., Maestre,
F. T., Mouazen, A. M., Zornoza, R., Ruiz-Sinoga, J. D., and Kuang, B.:
Assessment of Soil Organic Carbon at Local Scale with Spiked NIR
Calibrations: Effects of Selection and Extra-Weighting on the Spiking Subset,
Europ. J. Soil Sci., 65, 248–263, <a href="https://doi.org/10.1111/ejss.12129" target="_blank">https://doi.org/10.1111/ejss.12129</a>,
2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>Hansen et al.(2013)Hansen, Potapov, Moore, Hancher, Turubanova,
Tyukavina, Thau, Stehman, Goetz, Loveland, Kommareddy, Egorov, Chini,
Justice, and Townshend</label><mixed-citation>
Hansen, M. C., Potapov, P. V., Moore, R., Hancher, M., Turubanova, S. A.,
Tyukavina, A., Thau, D., Stehman, S. V., Goetz, S. J., Loveland, T. R.,
Kommareddy, A., Egorov, A., Chini, L., Justice, C. O., and Townshend, J.
R. G.: High-Resolution Global Maps of 21st-Century Forest Cover
Change, Science, 342, 850–853, <a href="https://doi.org/10.1126/science.1244693" target="_blank">https://doi.org/10.1126/science.1244693</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>Heri-Kazi(2020)</label><mixed-citation>
Heri-Kazi, A. B.: Caractérisation de l'état de dégradation des terres
par l'érosion hydrique dans le Sud-Kivu montagneux à l'Est de la R.D.
Congo, Thèse doctorale, Université Catholique de Louvain, Louvain La
Neuve, 279 pp., 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>Imerzoukene and
Van Ranst(2002)</label><mixed-citation>
Imerzoukene, S. and Van Ranst, E.: Une Banque de Données Pédologiques et
Son S.I.G, Pour Une Nouvelle Politique Agricole Au Rwanda,
Meded. Zitt. K. Acad. overzeese Wet, 47, 299–325, 2002.
</mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>IUSS Working Group
WRB(2015)</label><mixed-citation>
IUSS Working Group WRB: International Soil Classification System for Naming
Soils and Creating Legends for Soil Maps, World Soil Resources Reports
No. 106, FAO, Rome, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>Janik et al.(1998)Janik, Merry, and
Skjemstad</label><mixed-citation>
Janik, L. J., Merry, R. H., and Skjemstad, J. O.: Can Mid Infrared Diffuse
Reflectance Analysis Replace Soil Extractions?, Austr. J.  Exp. Agr., 38, 681–696, <a href="https://doi.org/10.1071/EA97144" target="_blank">https://doi.org/10.1071/EA97144</a>, 1998.
</mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>Jarvis et al.(2008)Jarvis, Reuter, Nelson, and
Guevara</label><mixed-citation>
Jarvis, A., Reuter, H. I., Nelson, A., and Guevara, E.: Hole-Filled Seamless
SRTM Data V4, <a href="https://srtm.csi.cgiar.org" target="_blank"/> (last access: 20 December 2020), 2008.
</mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>Jones et al.(2013)Jones, Breuning-Madsen, Brossard, Dampha,
Deckers, Dewitte, Hallett, Jones, Kilasara, Le Roux, Micheli, Montanarella,
Spaargaren, Tahar, Thiombiano, Van Ranst, Yemefack, and
Zougmore</label><mixed-citation>
Jones, A., Breuning-Madsen, H., Brossard, M., Dampha, A., Deckers, J.,
Dewitte, O., Hallett, S., Jones, R., Kilasara, M., Le Roux, P., Micheli, E.,
Montanarella, L., Spaargaren, O., Tahar, G., Thiombiano, L., Van Ranst, E.,
Yemefack, M., and Zougmore, R.: Soil Atlas of Africa, European
Commission, Publication Office of the European Union, Luxembourg,
<a href="https://doi.org/10.2788/52319" target="_blank">https://doi.org/10.2788/52319</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>Kearsley et al.(2013)Kearsley, de Haulleville, Hufkens, Kidimbu,
Toirambe, Baert, Huygens, Kebede, Defourny, Bogaert, Beeckman, Steppe,
Boeckx, and Verbeeck</label><mixed-citation>
Kearsley, E., de Haulleville, T., Hufkens, K., Kidimbu, A., Toirambe, B.,
Baert, G., Huygens, D., Kebede, Y., Defourny, P., Bogaert, J., Beeckman, H.,
Steppe, K., Boeckx, P., and Verbeeck, H.: Conventional Tree Height – Diameter Relationships Significantly Overestimate Aboveground Carbon Stocks
in the Central Congo Basin, Nat. Commun., 4, 1–8,
<a href="https://doi.org/10.1038/ncomms3269" target="_blank">https://doi.org/10.1038/ncomms3269</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>Kearsley et al.(2017)Kearsley, Verbeeck, Hufkens, Van de Perre,
Doetterl, Baert, Beeckman, Boeckx, and
Huygens</label><mixed-citation>
Kearsley, E., Verbeeck, H., Hufkens, K., Van de Perre, F., Doetterl, S.,
Baert, G., Beeckman, H., Boeckx, P., and Huygens, D.: Functional Community
Structure of African Monodominant <i>Gilbertiodendron
Dewevrei</i> Forest Influenced by Local Environmental Filtering, Ecol.
Evol., 7, 295–304, <a href="https://doi.org/10.1002/ece3.2589" target="_blank">https://doi.org/10.1002/ece3.2589</a>, 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>Lobsey et al.(2017)Lobsey, Viscarra Rossel, Poudier, and
Hedley</label><mixed-citation>
Lobsey, R., C., Viscarra Rossel, R. A., Poudier, P., and Hedley, C. B.:
Rs-local Data-mines Information from Spectral Libraries to Improve Local
Calibrations, Europ. J. Soil Sci., 68, 840–852,
<a href="https://doi.org/10.1111/ejss.12490" target="_blank">https://doi.org/10.1111/ejss.12490</a>, 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>Minten(2017)</label><mixed-citation>
Minten, K.: Development Of a Business Plan For Production And Export Of
Green Coffee Beans From The Equateur Province In The Democratic Republic Of
The Congo, Master thesis, Ghent University, Ghent, Belgium, 68 pp., 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>Moonen et al.(2019)Moonen, Verbist, Boyemba Bosela, Norgrove,
Dondeyne, Van Meerbeek, Kearsley, Verbeeck, Vermeir, Boeckx, and
Muys</label><mixed-citation>
Moonen, P. C., Verbist, B., Boyemba Bosela, F., Norgrove, L., Dondeyne, S.,
Van Meerbeek, K., Kearsley, E., Verbeeck, H., Vermeir, P., Boeckx, P., and
Muys, B.: Disentangling How Management Affects Biomass Stock and Productivity
of Tropical Secondary Forests Fallows, Sci. Tot. Environ., 659,
101–114, <a href="https://doi.org/10.1016/j.scitotenv.2018.12.138" target="_blank">https://doi.org/10.1016/j.scitotenv.2018.12.138</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>Mujinya(2012)</label><mixed-citation>
Mujinya, B. B.: Effects of Macrotermes Termites on the Mineralogical and
Electro-Chemical Properties of Ferralsol Materials in the Upper
Katanga (D.R. Congo), Doctoral thesis, Ghent University,
Ghent, Belgium, 190 pp., 2012.
</mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>Mujinya et al.(2010)Mujinya, Van Ranst, Verdoodt, Baert, and
Ngongo</label><mixed-citation>
Mujinya, B. B., Van Ranst, E., Verdoodt, A., Baert, G., and Ngongo, L.: Termite
Bioturbation Effects on Electro-Chemical Properties of Ferralsols in the
Upper Katanga (D.R. Congo), Geoderma, 158, 233–241,
<a href="https://doi.org/10.1016/j.geoderma.2010.04.033" target="_blank">https://doi.org/10.1016/j.geoderma.2010.04.033</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>Mujinya et al.(2011)Mujinya, Mees, Boeckx, Bodé, Baert, Erens,
Delefortrie, Verdoodt, Ngongo, and
Van Ranst</label><mixed-citation>
Mujinya, B. B., Mees, F., Boeckx, P., Bodé, S., Baert, G., Erens, H.,
Delefortrie, S., Verdoodt, A., Ngongo, M., and Van Ranst, E.: The Origin of
Carbonates in Termite Mounds of the Lubumbashi Area, D.R.
Congo, Geoderma, 165, 95–105, <a href="https://doi.org/10.1016/j.geoderma.2011.07.009" target="_blank">https://doi.org/10.1016/j.geoderma.2011.07.009</a>,
2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>Mujinya et al.(2013)Mujinya, Mees, Erens, Dumon, Baert, Boeckx,
Ngongo, and Van Ranst</label><mixed-citation>
Mujinya, B. B., Mees, F., Erens, H., Dumon, M., Baert, G., Boeckx, P., Ngongo,
M., and Van Ranst, E.: Clay Composition and Properties in Termite Mounds of
the Lubumbashi Area, D.R. Congo, Geoderma, 192, 304–315,
<a href="https://doi.org/10.1016/j.geoderma.2012.08.010" target="_blank">https://doi.org/10.1016/j.geoderma.2012.08.010</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>Mujinya et al.(2014)Mujinya, Adam, Mees, Bogaert, Vranken, Erens,
Baert, Ngongo, and Van Ranst</label><mixed-citation>
Mujinya, B. B., Adam, M., Mees, F., Bogaert, J., Vranken, I., Erens, H., Baert,
G., Ngongo, M., and Van Ranst, E.: Spatial Patterns and Morphology of Termite
(Macrotermes Falciger) Mounds in the Upper Katanga, D.R.
Congo, Catena, 114, 97–106, <a href="https://doi.org/10.1016/j.catena.2013.10.015" target="_blank">https://doi.org/10.1016/j.catena.2013.10.015</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>Næs(1987)</label><mixed-citation>
Næs, T.: The Design of Calibration in near Infra-Red Reflectance Analysis
by Clustering, J. Chemometr., 1, 121–134,
<a href="https://doi.org/10.1002/cem.1180010207" target="_blank">https://doi.org/10.1002/cem.1180010207</a>, 1987.
</mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>Naes et al.(1990)Naes, Isaksson, and
Kowalski</label><mixed-citation>
Naes, T., Isaksson, T., and Kowalski, B.: Locally Weighted Regression and
Scatter Correction for Near-Infrared Reflectance Data, Anal. Chem.,
62, 664–673, <a href="https://doi.org/10.1021/ac00206a003" target="_blank">https://doi.org/10.1021/ac00206a003</a>, 1990.
</mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>Ng et al.(2019)Ng, Minasny, Montazerolghaem, Padarian, Ferguson,
Bailey, and McBratney</label><mixed-citation>
Ng, W., Minasny, B., Montazerolghaem, M., Padarian, J., Ferguson, R., Bailey,
S., and McBratney, A. B.: Convolutional Neural Network for Simultaneous
Prediction of Several Soil Properties Using Visible/near-Infrared,
Mid-Infrared, and Their Combined Spectra, Geoderma, 352, 251–267,
<a href="https://doi.org/10.1016/j.geoderma.2019.06.016" target="_blank">https://doi.org/10.1016/j.geoderma.2019.06.016</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>Nocita et al.(2014)Nocita, Stevens, Toth, Panagos, van Wesemael,
and Montanarella</label><mixed-citation>
Nocita, M., Stevens, A., Toth, G., Panagos, P., van Wesemael, B., and
Montanarella, L.: Prediction of Soil Organic Carbon Content by Diffuse
Reflectance Spectroscopy Using a Local Partial Least Square Regression
Approach, Soil Biol. Biochem., 68, 337–347,
<a href="https://doi.org/10.1016/j.soilbio.2013.10.022" target="_blank">https://doi.org/10.1016/j.soilbio.2013.10.022</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>Nocita et al.(2015)Nocita, Stevens, van Wesemael, Aitkenhead,
Bachmann, Barthès, Ben Dor, Brown, Clairotte, Csorba, Dardenne,
Demattê, Genot, Guerrero, Knadel, Montanarella, Noon, Ramirez-Lopez,
Robertson, Sakai, Soriano-Disla, Shepherd, Stenberg, Towett, Vargas, and
Wetterlind</label><mixed-citation>
Nocita, M., Stevens, A., van Wesemael, B., Aitkenhead, M., Bachmann, M.,
Barthès, B., Ben Dor, E., Brown, D. J., Clairotte, M., Csorba, A.,
Dardenne, P., Demattê, J. A., Genot, V., Guerrero, C., Knadel, M.,
Montanarella, L., Noon, C., Ramirez-Lopez, L., Robertson, J., Sakai, H.,
Soriano-Disla, J. M., Shepherd, K. D., Stenberg, B., Towett, E. K., Vargas,
R., and Wetterlind, J.: Soil Spectroscopy: An Alternative to Wet
Chemistry for Soil Monitoring, in: Advances in Agronomy, Vol. 132,
Elsevier, 139–159, <a href="https://doi.org/10.1016/bs.agron.2015.02.002" target="_blank">https://doi.org/10.1016/bs.agron.2015.02.002</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>Padarian et al.(2019)Padarian, Minasny, and
McBratney</label><mixed-citation>
Padarian, J., Minasny, B., and McBratney, A.: Transfer Learning to Localise a
Continental Soil Vis-NIR Calibration Model, Geoderma, 340, 279–288,
<a href="https://doi.org/10.1016/j.geoderma.2019.01.009" target="_blank">https://doi.org/10.1016/j.geoderma.2019.01.009</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>R Core Team(2020)</label><mixed-citation>
R Core Team: R: A Language and Environment for Statistical Computing, R
Foundation for Statistical Computing, Vienna, Austria, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>Ramirez-Lopez(2020)</label><mixed-citation>
Ramirez-Lopez, L.: Resemble: Regression and Similarity Evaluation for
Memory-Based Learning in Spectral Chemometrics, r package version 2.1.1,
2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>Ramirez-Lopez et al.(2013a)Ramirez-Lopez, Behrens,
Schmidt, Rossel, Demattê, and
Scholten</label><mixed-citation>
Ramirez-Lopez, L., Behrens, T., Schmidt, K., Rossel, R. V., Demattê, J.,
and Scholten, T.: Distance and Similarity-Search Metrics for Use with Soil
Vis-NIR Spectra, Geoderma, 199, 43–53,
<a href="https://doi.org/10.1016/j.geoderma.2012.08.035" target="_blank">https://doi.org/10.1016/j.geoderma.2012.08.035</a>, 2013a.
</mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>Ramirez-Lopez et al.(2013b)Ramirez-Lopez, Behrens,
Schmidt, Stevens, Demattê, and
Scholten</label><mixed-citation>
Ramirez-Lopez, L., Behrens, T., Schmidt, K., Stevens, A., Demattê, J.
A. M., and Scholten, T.: The Spectrum-Based Learner: A New Local Approach
for Modeling Soil Vis–NIR Spectra of Complex Datasets,
Geoderma, 195, 268–279, <a href="https://doi.org/10.1016/j.geoderma.2012.12.014" target="_blank">https://doi.org/10.1016/j.geoderma.2012.12.014</a>,
2013b.
</mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>Ramirez-Lopez et al.(2014)Ramirez-Lopez, Schmidt, Behrens, van
Wesemael, Demattê, and
Scholten</label><mixed-citation>
Ramirez-Lopez, L., Schmidt, K., Behrens, T., van Wesemael, B., Demattê,
J. A., and Scholten, T.: Sampling Optimal Calibration Sets in Soil Infrared
Spectroscopy, Geoderma, 226, 140–150, <a href="https://doi.org/10.1016/j.geoderma.2014.02.002" target="_blank">https://doi.org/10.1016/j.geoderma.2014.02.002</a>,
2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>Ramirez-Lopez et al.(2019)Ramirez-Lopez, Wadoux, Franceschini, Terra,
Marques, Sayão, and Demattê</label><mixed-citation>
Ramirez-Lopez, L., Wadoux, A. M. J.-C., Franceschini, M. H. D., Terra, F. S.,
Marques, K. P. P., Sayão, V. M., and Demattê, J. A. M.: Robust Soil
Mapping at the Farm Scale with Vis-NIR Spectroscopy, Europ.
J. Soil Sci., 70, 378–393, <a href="https://doi.org/10.1111/ejss.12752" target="_blank">https://doi.org/10.1111/ejss.12752</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>Rinnan(2014)</label><mixed-citation>
Rinnan, A.: Pre-Processing in Vibrational Spectroscopy  –  When, Why
and How, Anal. Meth., 6, 7124–7129, <a href="https://doi.org/10.1039/C3AY42270D" target="_blank">https://doi.org/10.1039/C3AY42270D</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>Sanderman et al.(2020)Sanderman, Savage, and
Dangal</label><mixed-citation>
Sanderman, J., Savage, K., and Dangal, S. R.: Mid-infrared Spectroscopy for
Prediction of Soil Health Indicators in the United States, Soil Sci.
Soc. Am. J., 84, 251–261, <a href="https://doi.org/10.1002/saj2.20009" target="_blank">https://doi.org/10.1002/saj2.20009</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>Savitzky and Golay(1964)</label><mixed-citation>
Savitzky, A. and Golay, M. J. E.: Smoothing and Differentiation of Data
by Simplified Least Squares Procedures, Anal. Chem., 36,
1627–1639, <a href="https://doi.org/10.1021/ac60214a047" target="_blank">https://doi.org/10.1021/ac60214a047</a>, 1964.
</mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>Seidel et al.(2019)Seidel, Hutengs, Ludwig, Thiele-Bruhn, and
Vohland</label><mixed-citation>
Seidel, M., Hutengs, C., Ludwig, B., Thiele-Bruhn, S., and Vohland, M.:
Strategies for the Efficient Estimation of Soil Organic Carbon at the Field
Scale with Vis-NIR Spectroscopy: Spectral Libraries and Spiking vs.
Local Calibrations, Geoderma, 354, 1–13,
<a href="https://doi.org/10.1016/j.geoderma.2019.07.014" target="_blank">https://doi.org/10.1016/j.geoderma.2019.07.014</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib65"><label>Seybold et al.(2019)Seybold, Ferguson, Wysocki, Bailey, Anderson,
Nester, Schoeneberger, Wills, Libohova, Hoover, and
Thomas</label><mixed-citation>
Seybold, C. A., Ferguson, R., Wysocki, D., Bailey, S., Anderson, J., Nester,
B., Schoeneberger, P., Wills, S., Libohova, Z., Hoover, D., and Thomas, P.:
Application of Mid-Infrared Spectroscopy in Soil Survey, Soil
Sci. Soc. Am. J., 83, 1746–1759,
<a href="https://doi.org/10.2136/sssaj2019.06.0205" target="_blank">https://doi.org/10.2136/sssaj2019.06.0205</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib66"><label>Shenk et al.(1997)Shenk, Westerhaus, and
Berzaghi</label><mixed-citation>
Shenk, J. S., Westerhaus, M. O., and Berzaghi, P.: Investigation of a LOCAL
Calibration Procedure for near Infrared Instruments, Journal of Near
Infrared Spectroscopy, 5, 223–232, <a href="https://doi.org/10.1255/jnirs.115" target="_blank">https://doi.org/10.1255/jnirs.115</a>, 1997.
</mixed-citation></ref-html>
<ref-html id="bib1.bib67"><label>Shepherd and Walsh(2007)</label><mixed-citation>
Shepherd, K. D. and Walsh, M. G.: Infrared
Spectroscopy – Enabling an Evidence-Based Diagnostic
Surveillance Approach to Agricultural and Environmental Management
in Developing Countries, Journal of Near Infrared Spectroscopy, 15,
1–19, <a href="https://doi.org/10.1255/jnirs.716" target="_blank">https://doi.org/10.1255/jnirs.716</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib68"><label>Shi et al.(2014)Shi, Wang, Peng, Ji, Liu, Li, and
Viscarra Rossel</label><mixed-citation>
Shi, Z., Wang, Q., Peng, J., Ji, W., Liu, H., Li, X., and Viscarra Rossel,
R. A.: Development of a National VNIR Soil-Spectral Library for Soil
Classification and Prediction of Organic Matter Concentrations, Science China
Earth Sciences, 57, 1671–1680, <a href="https://doi.org/10.1007/s11430-013-4808-x" target="_blank">https://doi.org/10.1007/s11430-013-4808-x</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib69"><label>Shi et al.(2015)Shi, Ji, Viscarra Rossel, Chen, and
Zhou</label><mixed-citation>
Shi, Z., Ji, W., Viscarra Rossel, R. A., Chen, S., and Zhou, Y.: Prediction of
Soil Organic Matter Using a Spatially Constrained Local Partial Least Squares
Regression and the Chinese Vis-NIR Spectral Library, Europ. J. Soil Sci., 66, 679–687, <a href="https://doi.org/10.1111/ejss.12272" target="_blank">https://doi.org/10.1111/ejss.12272</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib70"><label>Sila et al.(2016)Sila, Shepherd, and
Pokhariyal</label><mixed-citation>
Sila, A. M., Shepherd, K. D., and Pokhariyal, G. P.: Evaluating the Utility of
Mid-Infrared Spectral Subspaces for Predicting Soil Properties, Chemometrics
and Intelligent Laboratory Systems, 153, 92–105,
<a href="https://doi.org/10.1016/j.chemolab.2016.02.013" target="_blank">https://doi.org/10.1016/j.chemolab.2016.02.013</a>, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib71"><label>Soriano-Disla et al.(2014)Soriano-Disla, Janik, Viscarra Rossel,
Macdonald, and McLaughlin</label><mixed-citation>
Soriano-Disla, J. M., Janik, L. J., Viscarra Rossel, R. A., Macdonald, L. M.,
and McLaughlin, M. J.: The Performance of Visible, Near-, and
Mid-Infrared Reflectance Spectroscopy for Prediction of Soil
Physical, Chemical, and Biological Properties, Appl. Spec.  Rev., 49, 139–186, <a href="https://doi.org/10.1080/05704928.2013.811081" target="_blank">https://doi.org/10.1080/05704928.2013.811081</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib72"><label>Stevens and Ramirez-Lopez(2020)</label><mixed-citation>
Stevens, A. and Ramirez-Lopez, L.: Prospectr: Miscellaneous Functions for
Processing and Sample Selection of Spectroscopic Data, r package version
0.2.0, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib73"><label>Stevens et al.(2013)Stevens, Nocita, Tóth, Montanarella, and van
Wesemael</label><mixed-citation>
Stevens, A., Nocita, M., Tóth, G., Montanarella, L., and van Wesemael, B.:
Prediction of Soil Organic Carbon at the European Scale by
Visible and Near InfraRed Reflectance Spectroscopy, PLOS ONE, 8,
1–13, <a href="https://doi.org/10.1371/journal.pone.0066409" target="_blank">https://doi.org/10.1371/journal.pone.0066409</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib74"><label>Summerauer(2017)</label><mixed-citation>
Summerauer, L.: Sustainable Agricultural Intensification Methods of
Cassava Based Systems for Improving Livelihoods and Forest
Conservation in the Congo Basin, Master thesis, ETH Zurich, Zurich,
Switzerland, 60 pp., 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib75"><label>Summerauer(2020)</label><mixed-citation>
Summerauer, L.: laura-summerauer/ssl-central-africa: Codes and data for manuscript submission (submission version) (v.1.0), Zenodo [code], <a href="https://doi.org/10.5281/zenodo.4351254" target="_blank">https://doi.org/10.5281/zenodo.4351254</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib76"><label>Tsakiridis et al.(2019)Tsakiridis, Theocharis, Panagos, and
Zalidis</label><mixed-citation>
Tsakiridis, N. L., Theocharis, J. B., Panagos, P., and Zalidis, G. C.: An
Evolutionary Fuzzy Rule-Based System Applied to the Prediction of Soil
Organic Carbon from Soil Spectral Libraries, Applied Soft Computing, 81,
1–18, <a href="https://doi.org/10.1016/j.asoc.2019.105504" target="_blank">https://doi.org/10.1016/j.asoc.2019.105504</a>, 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib77"><label>Tyukavina et al.(2018)Tyukavina, Hansen, Potapov, Parker, Okpa,
Stehman, Kommareddy, and Turubanova</label><mixed-citation>
Tyukavina, A., Hansen, M. C., Potapov, P., Parker, D., Okpa, C., Stehman,
S. V., Kommareddy, I., and Turubanova, S.: Congo Basin Forest Loss
Dominated by Increasing Smallholder Clearing, Sci. Adv., 4, 1–12,
<a href="https://doi.org/10.1126/sciadv.aat2993" target="_blank">https://doi.org/10.1126/sciadv.aat2993</a>, 2018.
</mixed-citation></ref-html>
<ref-html id="bib1.bib78"><label>Tziolas et al.(2019)Tziolas, Tsakiridis, Ben-Dor, Theocharis, and
Zalidis</label><mixed-citation>
Tziolas, N., Tsakiridis, N., Ben-Dor, E., Theocharis, J., and Zalidis, G.: A
Memory-Based Learning Approach Utilizing Combined Spectral Sources and
Geographical Proximity for Improved VIS-NIR-SWIR Soil Properties
Estimation, Geoderma, 340, 11–24, <a href="https://doi.org/10.1016/j.geoderma.2018.12.044" target="_blank">https://doi.org/10.1016/j.geoderma.2018.12.044</a>,
2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib79"><label>Vågen et al.(2020)Vågen, Winowiecki, Desta, Tondoh, Weullow,
Shepherd, and Sila</label><mixed-citation>
Vågen, T.-G., Winowiecki, L. A., Desta, L., Tondoh, E. J., Weullow, E.,
Shepherd, K., and Sila, A.: Mid-Infrared Spectra (MIRS) from ICRAF
Soil and Plant Spectroscopy Laboratory: Africa Soil Information
Service (AfSIS) Phase I 2009-2013, World Agroforestry – Research
Data Repository, V1,  <a href="https://doi.org/10.34725/DVN/QXCWP1" target="_blank">https://doi.org/10.34725/DVN/QXCWP1</a>,
2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib80"><label>Van Ranst et al.(2010)Van Ranst, Verdoodt, and
Baert</label><mixed-citation>
Van Ranst, E., Verdoodt, A., and Baert, G.: Soil Mapping in Africa at
the Crossroads: Work to Make up for Lost Ground, Meded. Zitt.
K. Acad. overzeese Wet, 56, 147–163, 2010.

</mixed-citation></ref-html>
<ref-html id="bib1.bib81"><label>Veldkamp et al.(2020)Veldkamp, Schmidt, Powers, and
Corre</label><mixed-citation>
Veldkamp, E., Schmidt, M., Powers, J. S., and Corre, M. D.: Deforestation and
Reforestation Impacts on Soils in the Tropics, Nat. Rev. Earth   Environ., 1, 590–605, <a href="https://doi.org/10.1038/s43017-020-0091-5" target="_blank">https://doi.org/10.1038/s43017-020-0091-5</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib82"><label>Viscarra Rossel and
Brus(2018)</label><mixed-citation>
Viscarra Rossel, R. A. and Brus, D. J.: The Cost-Efficiency and Reliability of
Two Methods for Soil Organic C Accounting: The Cost-Efficiency and
Reliability of Two Methods for Soil Organic C Accounting, Land
Degradation &amp; Development, 29, 506–520, <a href="https://doi.org/10.1002/ldr.2887" target="_blank">https://doi.org/10.1002/ldr.2887</a>, 2018.
</mixed-citation></ref-html>
<ref-html id="bib1.bib83"><label>Viscarra Rossel et al.(2016)Viscarra Rossel, Behrens, Ben-Dor,
Brown, Demattê, Shepherd, Shi, Stenberg, Stevens, Adamchuk, Aïchi,
Barthès, Bartholomeus, Bayer, Bernoux, Böttcher, Brodský, Du,
Chappell, Fouad, Genot, Gomez, Grunwald, Gubler, Guerrero, Hedley, Knadel,
Morrás, Nocita, Ramirez-Lopez, Roudier, Campos, Sanborn, Sellitto,
Sudduth, Rawlins, Walter, Winowiecki, Hong, and
Ji</label><mixed-citation>
Viscarra Rossel, R. A., Behrens, T., Ben-Dor, E., Brown, D. J., Demattê,
J. A. M., Shepherd, K. D., Shi, Z., Stenberg, B., Stevens, A., Adamchuk, V.,
Aïchi, H., Barthès, B. G., Bartholomeus, H. M., Bayer, A. D.,
Bernoux, M., Böttcher, K., Brodský, L., Du, C. W., Chappell, A.,
Fouad, Y., Genot, V., Gomez, C., Grunwald, S., Gubler, A., Guerrero, C.,
Hedley, C. B., Knadel, M., Morrás, H. J. M., Nocita, M., Ramirez-Lopez,
L., Roudier, P., Campos, E. M. R., Sanborn, P., Sellitto, V. M., Sudduth,
K. A., Rawlins, B. G., Walter, C., Winowiecki, L. A., Hong, S. Y., and Ji,
W.: A Global Spectral Library to Characterize the World's Soil, Earth-Sci.   Rev., 155, 198–230, <a href="https://doi.org/10.1016/j.earscirev.2016.01.012" target="_blank">https://doi.org/10.1016/j.earscirev.2016.01.012</a>, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib84"><label>Vohland et al.(2016)Vohland, Harbich, Ludwig, Emmerling, and
Thiele-Bruhn</label><mixed-citation>
Vohland, M., Harbich, M., Ludwig, M., Emmerling, C., and Thiele-Bruhn, S.:
Quantification of Soil Variables in a Heterogeneous Soil Region With
VIS-NIR-SWIR Data Using Different Statistical
Sampling and Modeling Strategies, IEEE Journal of Selected Topics in
Applied Earth Observations and Remote Sensing, 9, 4011–4021,
<a href="https://doi.org/10.1109/JSTARS.2016.2572879" target="_blank">https://doi.org/10.1109/JSTARS.2016.2572879</a>, 2016.

</mixed-citation></ref-html>
<ref-html id="bib1.bib85"><label>Vollset et al.(2020)Vollset, Goren, Yuan, Cao, Smith, Hsiao,
Bisignano, Azhar, Castro, Chalek, Dolgert, Frank, Fukutaki, Hay, Lozano,
Mokdad, Nandakumar, Pierce, Pletcher, Robalik, Steuben, Wunrow, Zlavog, and
Murray</label><mixed-citation>
Vollset, S. E., Goren, E., Yuan, C.-W., Cao, J., Smith, A. E., Hsiao, T.,
Bisignano, C., Azhar, G. S., Castro, E., Chalek, J., Dolgert, A. J., Frank,
T., Fukutaki, K., Hay, S. I., Lozano, R., Mokdad, A. H., Nandakumar, V.,
Pierce, M., Pletcher, M., Robalik, T., Steuben, K. M., Wunrow, H. Y., Zlavog,
B. S., and Murray, C. J. L.: Fertility, Mortality, Migration, and Population
Scenarios for 195 Countries and Territories from 2017 to 2100: A Forecasting
Analysis for the Global Burden of Disease Study, The Lancet, 396,
1–22, <a href="https://doi.org/10.1016/S0140-6736(20)30677-2" target="_blank">https://doi.org/10.1016/S0140-6736(20)30677-2</a>, 2020.
</mixed-citation></ref-html>
<ref-html id="bib1.bib86"><label>Wetterlind and
Stenberg(2010)</label><mixed-citation>
Wetterlind, J. and Stenberg, B.: Near-Infrared Spectroscopy for within-Field
Soil Characterization: Small Local Calibrations Compared with National
Libraries Spiked with Local Samples, Europ. J. Soil Sci., 61,
823–843, <a href="https://doi.org/10.1111/j.1365-2389.2010.01283.x" target="_blank">https://doi.org/10.1111/j.1365-2389.2010.01283.x</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib87"><label>Wise and Gallagher(1996)</label><mixed-citation>
Wise, B. M. and Gallagher, N. B.: The Process Chemometrics Approach to Process
Monitoring and Fault Detection, Journal of Process Control, 6, 329–348,
<a href="https://doi.org/10.1016/0959-1524(96)00009-1" target="_blank">https://doi.org/10.1016/0959-1524(96)00009-1</a>, 1996.
</mixed-citation></ref-html>
<ref-html id="bib1.bib88"><label>Wise and Roginski(2015)</label><mixed-citation>
Wise, B. M. and Roginski, R. T.: A Calibration Model Maintenance Roadmap,
IFAC-PapersOnLine, 48, 260–265, <a href="https://doi.org/10.1016/j.ifacol.2015.08.191" target="_blank">https://doi.org/10.1016/j.ifacol.2015.08.191</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib89"><label>Wold et al.(1984)Wold, Ruhe, Wold, and
Dunn</label><mixed-citation>
Wold, S., Ruhe, A., Wold, H., and Dunn, III, W. J.: The Collinearity
Problem, in: Linear Regression, The Partial Least Squares (PLS)
Approach to Generalized Inverses, SIAM Journal on Scientific and
Statistical Computing, 5, 735–743, <a href="https://doi.org/10.1137/0905052" target="_blank">https://doi.org/10.1137/0905052</a>, 1984.
</mixed-citation></ref-html>
<ref-html id="bib1.bib90"><label>Wold et al.(2001)Wold, Trygg, Berglund, and
Antti</label><mixed-citation>
Wold, S., Trygg, J., Berglund, A., and Antti, H.: Some Recent Developments in
PLS Modeling, Chemometrics and Intelligent Laboratory Systems, 58,
131–150, <a href="https://doi.org/10.1016/S0169-7439(01)00156-3" target="_blank">https://doi.org/10.1016/S0169-7439(01)00156-3</a>, 2001.
</mixed-citation></ref-html>--></article>
