<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">ACP</journal-id><journal-title-group>
    <journal-title>Atmospheric Chemistry and Physics</journal-title>
    <abbrev-journal-title abbrev-type="publisher">ACP</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Atmos. Chem. Phys.</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1680-7324</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/acp-19-3645-2019</article-id><title-group><article-title>Constructing a data-driven receptor model for organic and inorganic aerosol
– a synthesis analysis of eight mass<?xmltex \hack{\break}?> spectrometric data sets from a boreal
forest site</article-title><alt-title>Constructing a data-driven receptor model for organic and inorganic aerosol</alt-title>
      </title-group><?xmltex \runningtitle{Constructing a data-driven receptor model for organic and inorganic aerosol}?><?xmltex \runningauthor{M. \"{A}ij\"{a}l\"{a} et al.}?>
      <contrib-group>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Äijälä</surname><given-names>Mikko</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Daellenbach</surname><given-names>Kaspar R.</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-1246-6396</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Canonaco</surname><given-names>Francesco</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Heikkinen</surname><given-names>Liine</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-7837-967X</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff3">
          <name><surname>Junninen</surname><given-names>Heikki</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Petäjä</surname><given-names>Tuukka</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-1881-9044</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Kulmala</surname><given-names>Markku</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-3464-7825</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Prévôt</surname><given-names>André S. H.</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="yes" rid="aff1">
          <name><surname>Ehn</surname><given-names>Mikael</given-names></name>
          <email>mikael.ehn@helsinki.fi</email>
        <ext-link>https://orcid.org/0000-0002-0215-4893</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>Institute for Atmospheric and Earth System Research/Physics, University of Helsinki, Helsinki, Finland</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>Laboratory of Atmospheric Chemistry, Paul Scherrer Institute, Villigen, Switzerland</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>Laboratory of Environmental Physics, University of Tartu, Tartu, Estonia</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Mikael Ehn (mikael.ehn@helsinki.fi)</corresp></author-notes><pub-date><day>21</day><month>March</month><year>2019</year></pub-date>
      
      <volume>19</volume>
      <issue>6</issue>
      <fpage>3645</fpage><lpage>3672</lpage>
      <history>
        <date date-type="received"><day>6</day><month>October</month><year>2018</year></date>
           <date date-type="rev-request"><day>19</day><month>October</month><year>2018</year></date>
           <date date-type="rev-recd"><day>18</day><month>January</month><year>2019</year></date>
           <date date-type="accepted"><day>15</day><month>February</month><year>2019</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2019 </copyright-statement>
        <copyright-year>2019</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://acp.copernicus.org/articles/.html">This article is available from https://acp.copernicus.org/articles/.html</self-uri><self-uri xlink:href="https://acp.copernicus.org/articles/.pdf">The full text article is available as a PDF file from https://acp.copernicus.org/articles/.pdf</self-uri>
      <abstract><title>Abstract</title>
    <p id="d1e168">The interactions between organic and
inorganic aerosol chemical components are integral to understanding and
modelling climate and health-relevant aerosol physicochemical properties,
such as volatility, hygroscopicity, light scattering and toxicity. This study
presents a synthesis analysis for eight data sets, of non-refractory aerosol
composition, measured at a boreal forest site. The measurements, performed
with an aerosol mass spectrometer, cover in total around 9 months over the
course of 3 years. In our statistical analysis, we use the complete organic
and inorganic unit-resolution mass spectra, as opposed to the more common
approach of only including the organic fraction. The analysis is based on
iterative, combined use of (1) data reduction, (2) classification and
(3) scaling tools, producing a data-driven chemical mass balance type of
model capable of describing site-specific aerosol composition. The receptor
model we constructed was able to explain <inline-formula><mml:math id="M1" display="inline"><mml:mrow><mml:mn mathvariant="normal">83</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula> % of variation in
data, which increased to <inline-formula><mml:math id="M2" display="inline"><mml:mrow><mml:mn mathvariant="normal">96</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:math></inline-formula> % when signals from low
signal-to-noise variables were not considered. The resulting interpretation
of an extensive set of aerosol mass spectrometric data infers seven distinct
aerosol chemical components for a rural boreal forest site: ammonium sulfate
(<inline-formula><mml:math id="M3" display="inline"><mml:mrow><mml:mn mathvariant="normal">35</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> % of mass), low and semi-volatile oxidised organic aerosols
(<inline-formula><mml:math id="M4" display="inline"><mml:mrow><mml:mn mathvariant="normal">27</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula> % and <inline-formula><mml:math id="M5" display="inline"><mml:mrow><mml:mn mathvariant="normal">12</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> %), biomass burning organic aerosol (<inline-formula><mml:math id="M6" display="inline"><mml:mrow><mml:mn mathvariant="normal">11</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> %), a nitrate-containing organic aerosol type (<inline-formula><mml:math id="M7" display="inline"><mml:mrow><mml:mn mathvariant="normal">7</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula> %),
ammonium nitrate (<inline-formula><mml:math id="M8" display="inline"><mml:mrow><mml:mn mathvariant="normal">5</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula> %), and hydrocarbon-like organic aerosol (<inline-formula><mml:math id="M9" display="inline"><mml:mrow><mml:mn mathvariant="normal">3</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> %). Some of the additionally observed, rare outlier aerosol types
likely emerge due to surface ionisation effects and likely represent amine
compounds from an unknown source and alkaline metals from emissions of a
nearby district heating plant. Compared to traditional, ion-balance-based
inorganics apportionment schemes for aerosol mass spectrometer data, our
statistics-based method provides an improved, more robust approach, yielding
readily useful information for the modelling of submicron atmospheric
aerosols physical and chemical properties. The results also shed light on the
division between organic and inorganic aerosol types and dynamics of salt
formation in aerosol. Equally importantly, the combined methodology
exemplifies an iterative analysis, using consequent analysis steps by a
combination of statistical methods. Such an approach offers new ways to home
in on physicochemically sensible solutions with minimal need for a priori
information or analyst interference. We therefore suggest that similar
statistics-based approaches offer significant potential for un- or semi-supervised machine-learning applications in future analyses of aerosol
mass spectrometric data.</p>
  </abstract>
    </article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <title>Introduction</title>
      <p id="d1e287">Along with particle size, aerosol chemical composition is fundamental in
understanding aerosol physicochemical properties such as hygroscopicity,
volatility, optics and toxicity (Bilde et al., 2015; Swietlicki et al., 2008;
Zimmermann, 2015). In the past decade aerosol mass spectrometry has provided
a way to quantitatively resolve basic chemical<?pagebreak page3646?> composition of aerosol in near
real time. This not only enables basic chemical speciation into organic and
common inorganic ion species, but also produces a wealth of complex mass
spectrometric data. It has since become clear that these data sets, although
superficially hard to interpret, are rich in chemical information and their
statistical analysis yields considerable new knowledge. However, tapping into
this information source requires use of advanced analysis tools and
chemometric methods (i.e. “using mathematical and statistical methods to
provide maximum chemical information by analysing chemical data”; Kowalski,
1975). Consequently, advanced statistical methods for data reduction have
quickly gained traction in aerosol mass spectrometry, and are presently
widely used for deconvolution of complex organic mass spectra into their
underlying components. Specifically, the positive matrix factorisation
algorithm (PMF; Paatero and Tapper, 1994) has achieved a predominant status
as the state-of-the-art analysis tool for deconvolving aerosol mass
spectrometric data. Factorisation methods such as PMF notably allow for the
condensation of information found in high-dimension data matrices into a
manageable number of factors, corresponding to aerosol chemical species,
sources or processes, for example. Data reduction often additionally allows
for improved visualisation, aiding in interpretation of the underlying
aerosol chemical phenomena.</p>
      <p id="d1e290">In exploratory factor analysis, the principal difficulties often relate to
deciding the optimal number of factors, choosing between multiple solutions
of mathematically similar quality, and estimating the reliability and
uncertainty of the results. Lacking robust but easy-to-use mathematical
tools, the selection and interpretation of factorisation solutions remains
prone to subjective bias by the analyst. Specifically, while analyst-imposed
additional constraints in factorisation may sometimes be required to reduce
rotational uncertainty and extract minor factors in data (e.g. Canonaco et
al., 2013; Crippa et al., 2014) such procedures are especially prone to
analyst-subjective decisions. Evaluation and verification of a factorisation
solution thus generally requires meticulous study and understanding of, for
example, correlations with auxiliary data, temporal changes and cycles and spectral
references. While statistics-driven methods for spectra comparison and
classification as of yet remain marginal in aerosol mass spectrometry, they
do show promise in their capability to automatically group similar spectra
based on their chemically relevant features, producing comparable
classifications to those performed manually by expert analysts
(Äijälä et al., 2017; Rebotier and Prather, 2007; Freutel et
al., 2013).</p>
      <p id="d1e293">The overwhelming majority of PMF analyses to date from aerosol mass spectrometer (AMS) have been
performed on the organic fraction alone (Zhang et al., 2011). Contrary to
popular belief, there exists no tenable reasons to limit chemometric
analysis to organic signals, as exemplified by the analyses of Sun et al. (2012) and Hao et al. (2014). Although it requires some additional data
preparation and processing, inclusion of inorganics provides additional
insight into, for example, salt formation in aerosol. In this work, we apply data
reduction and classification methods for analysing organic and inorganic
aerosol mass spectral data from several measurement campaigns in the boreal
forest. We then derive a comprehensive receptor model resolving the dominant
aerosol categories at the site. In addition, by presenting an example of a
semi-supervised, statistics-driven analysis of large mass spectral data
sets, we hope to pave the way for machine-learning-based data analysis
approaches, reducing the need for expert analyst input and subjective
judgement at each step.</p>
</sec>
<sec id="Ch1.S2">
  <title>Methods</title>
      <p id="d1e302">Our instrumentation, data processing, measurement site and analysis
algorithms have been comprehensively described in previous literature, to
which we refer in the corresponding sections. Thus, we focus on the new
aspects of this work, showing how the individual methods can be connected to
form an analysis chain, and to exemplify how chemometric information can be
propagated through it. In short, we will first cover the measurement site,
SMEAR II (Station for Measuring Ecosystem–Atmosphere Relations) and the sets
of data available to us (Sect. 2.1). We then describe our mass spectrometer
instrument and preparation of data (Sect. 2.2). In Sect. 2.3, we will briefly
go through the various statistical tools and algorithms, covering the basics
of data factorisation, classification of spectra using a clustering algorithm
and clustering solution evaluation, and detail the pre- and post-weighting
involved. Section 2.4 describes typical reference methods for inorganics and
nitrate apportionment: an ion balance scheme and a separate parameterisation
for estimating organonitrate loading, to provide a comparison for the
inorganic speciation from our statistics-based receptor model. Finally, in
Sect. 2.5, we present a summarised, step-by-step description of how the
methods were combined to produce a receptor model for aerosol composition at
the measurement site.</p>
<sec id="Ch1.S2.SS1">
  <title>Measurement site and collection of data</title>
<sec id="Ch1.S2.SS1.SSS1">
  <title>The SMEAR II site</title>
      <p id="d1e315">The AMS data of this study were collected at the SMEAR II site in Hyytiälä, southern
Finland (61<inline-formula><mml:math id="M10" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>50<inline-formula><mml:math id="M11" display="inline"><mml:msup><mml:mi/><mml:mo>′</mml:mo></mml:msup></mml:math></inline-formula>40<inline-formula><mml:math id="M12" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msup></mml:math></inline-formula> N, 24<inline-formula><mml:math id="M13" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>17<inline-formula><mml:math id="M14" display="inline"><mml:msup><mml:mi/><mml:mo>′</mml:mo></mml:msup></mml:math></inline-formula>013<inline-formula><mml:math id="M15" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msup></mml:math></inline-formula> E). The site is a
well-known and well-equipped atmospheric research station, representing rural,
background atmosphere in the boreal forest biome. The site and earlier
measurements therein have been extensively described and reported in
the literature (e.g. Hari and Kulmala, 2005; Williams et al., 2011;
Äijälä et al., 2017).</p>
      <p id="d1e379">The environment consists mostly of forests dominated by Scots pine (<italic>Pinus Sylvestris</italic>) – 90 %
of land in the nearest 50 km, and 94 % in the nearest 5 km is forested
(Williams et al., 2011).</p>
      <?pagebreak page3647?><p id="d1e385">A large part of the aerosol loading at SMEAR II is attributable to regional
biogenic secondary organic aerosol (SOA; Corrigan et al., 2013; Crippa et
al., 2014; Allan et al., 2006) and long-range transport from industrial
regions in southern Finland, western Russia and central Europe (Kulmala et
al., 2000; Patokoski et al., 2015; Niemi et al., 2009; Sogacheva et al.,
2005). Regional anthropogenic aerosol sources include the towns Orivesi (pop.
9500; 19 km south) and Tampere (pop. 213 000; 48 km south-west), as well
as two sawmills and a pellet factory in the village of Korkeakoski, Juupajoki
(7 km east-south-east of the station). The surrounding countryside is
sparsely populated (5–10 inhabitants km<inline-formula><mml:math id="M16" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula>), and although emissions
from agriculture, traffic, domestic heating, cooking and other combustion
sources (saunas, barbecues, agricultural machinery etc.) are limited, they
are clearly observable at the station and may increase aerosol loading in
often plume-type pollution events. The anthropogenic organic aerosols were
further analysed previously (Äijälä et al., 2017).</p>

<?xmltex \floatpos{t}?><table-wrap id="Ch1.T1" specific-use="star"><label>Table 1</label><caption><p id="d1e403">Data sets used in this study and their time frames
(dd.mm.yyyy).</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Data set</oasis:entry>
         <oasis:entry colname="col2">Data set</oasis:entry>
         <oasis:entry colname="col3">Campaign</oasis:entry>
         <oasis:entry colname="col4">Start time</oasis:entry>
         <oasis:entry colname="col5">End time</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">number</oasis:entry>
         <oasis:entry colname="col2">name</oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">I</oasis:entry>
         <oasis:entry colname="col2">“May 2008”</oasis:entry>
         <oasis:entry colname="col3">EUCAARI</oasis:entry>
         <oasis:entry colname="col4">29.04.2008</oasis:entry>
         <oasis:entry colname="col5">08.06.2008</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">II</oasis:entry>
         <oasis:entry colname="col2">“Sep 2008”</oasis:entry>
         <oasis:entry colname="col3">EUCAARI</oasis:entry>
         <oasis:entry colname="col4">10.09.2008</oasis:entry>
         <oasis:entry colname="col5">15.10.2008</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">III</oasis:entry>
         <oasis:entry colname="col2">“Mar 2009”</oasis:entry>
         <oasis:entry colname="col3">EUCAARI</oasis:entry>
         <oasis:entry colname="col4">04.03.2009</oasis:entry>
         <oasis:entry colname="col5">06.04.2009</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">IV</oasis:entry>
         <oasis:entry colname="col2">“May 2009”</oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4">29.04.2009</oasis:entry>
         <oasis:entry colname="col5">28.05.2009</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">V</oasis:entry>
         <oasis:entry colname="col2">“Jun 2009”</oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4">12.06.2009</oasis:entry>
         <oasis:entry colname="col5">08.08.2009</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">VI</oasis:entry>
         <oasis:entry colname="col2">“Aug 2009”</oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4">13.08.2009</oasis:entry>
         <oasis:entry colname="col5">19.09.2009</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">VII</oasis:entry>
         <oasis:entry colname="col2">“Summer 2010”</oasis:entry>
         <oasis:entry colname="col3">HUMPPA-COPEC</oasis:entry>
         <oasis:entry colname="col4">09.07.2010</oasis:entry>
         <oasis:entry colname="col5">07.08.2010</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">VIII</oasis:entry>
         <oasis:entry colname="col2">“Winter 2010”</oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4">10.11.2010</oasis:entry>
         <oasis:entry colname="col5">07.01.2011</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

<?xmltex \floatpos{t}?><table-wrap id="Ch1.T2" specific-use="star"><label>Table 2</label><caption><p id="d1e606">For months when AMS data were
available, percentages indicate the fraction of days with at least one data
point.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="13">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right"/>
     <oasis:colspec colnum="8" colname="col8" align="right"/>
     <oasis:colspec colnum="9" colname="col9" align="right"/>
     <oasis:colspec colnum="10" colname="col10" align="right"/>
     <oasis:colspec colnum="11" colname="col11" align="right"/>
     <oasis:colspec colnum="12" colname="col12" align="right"/>
     <oasis:colspec colnum="13" colname="col13" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Jan</oasis:entry>
         <oasis:entry colname="col3">Feb</oasis:entry>
         <oasis:entry colname="col4">Mar</oasis:entry>
         <oasis:entry colname="col5">Apr</oasis:entry>
         <oasis:entry colname="col6">May</oasis:entry>
         <oasis:entry colname="col7">Jun</oasis:entry>
         <oasis:entry colname="col8">Jul</oasis:entry>
         <oasis:entry colname="col9">Aug</oasis:entry>
         <oasis:entry colname="col10">Sep</oasis:entry>
         <oasis:entry colname="col11">Oct</oasis:entry>
         <oasis:entry colname="col12">Nov</oasis:entry>
         <oasis:entry colname="col13">Dec</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">2008</oasis:entry>
         <oasis:entry colname="col2">–</oasis:entry>
         <oasis:entry colname="col3">–</oasis:entry>
         <oasis:entry colname="col4">–</oasis:entry>
         <oasis:entry colname="col5">–</oasis:entry>
         <oasis:entry colname="col6">65 %</oasis:entry>
         <oasis:entry colname="col7">20 %</oasis:entry>
         <oasis:entry colname="col8">–</oasis:entry>
         <oasis:entry colname="col9">–</oasis:entry>
         <oasis:entry colname="col10">70 %</oasis:entry>
         <oasis:entry colname="col11">48 %</oasis:entry>
         <oasis:entry colname="col12">–</oasis:entry>
         <oasis:entry colname="col13">–</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">2009</oasis:entry>
         <oasis:entry colname="col2">–</oasis:entry>
         <oasis:entry colname="col3">–</oasis:entry>
         <oasis:entry colname="col4">94 %</oasis:entry>
         <oasis:entry colname="col5">23 %</oasis:entry>
         <oasis:entry colname="col6">90 %</oasis:entry>
         <oasis:entry colname="col7">63 %</oasis:entry>
         <oasis:entry colname="col8">81 %</oasis:entry>
         <oasis:entry colname="col9">87 %</oasis:entry>
         <oasis:entry colname="col10">63 %</oasis:entry>
         <oasis:entry colname="col11">–</oasis:entry>
         <oasis:entry colname="col12">–</oasis:entry>
         <oasis:entry colname="col13">–</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">2010</oasis:entry>
         <oasis:entry colname="col2">–</oasis:entry>
         <oasis:entry colname="col3">–</oasis:entry>
         <oasis:entry colname="col4">–</oasis:entry>
         <oasis:entry colname="col5">–</oasis:entry>
         <oasis:entry colname="col6">–</oasis:entry>
         <oasis:entry colname="col7">–</oasis:entry>
         <oasis:entry colname="col8">74 %</oasis:entry>
         <oasis:entry colname="col9">68 %</oasis:entry>
         <oasis:entry colname="col10">–</oasis:entry>
         <oasis:entry colname="col11">–</oasis:entry>
         <oasis:entry colname="col12">47 %</oasis:entry>
         <oasis:entry colname="col13">100 %</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">2011</oasis:entry>
         <oasis:entry colname="col2">23 %</oasis:entry>
         <oasis:entry colname="col3">–</oasis:entry>
         <oasis:entry colname="col4">–</oasis:entry>
         <oasis:entry colname="col5">–</oasis:entry>
         <oasis:entry colname="col6">–</oasis:entry>
         <oasis:entry colname="col7">–</oasis:entry>
         <oasis:entry colname="col8">–</oasis:entry>
         <oasis:entry colname="col9">–</oasis:entry>
         <oasis:entry colname="col10">–</oasis:entry>
         <oasis:entry colname="col11">–</oasis:entry>
         <oasis:entry colname="col12">–</oasis:entry>
         <oasis:entry colname="col13">–</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

</sec>
<sec id="Ch1.S2.SS1.SSS2">
  <title>Data sets</title>
      <p id="d1e873">In this study, the aerosol composition was monitored by an AMS between 2008
and 2011, during several short measurement campaigns. Notable larger,
intensive campaigns at the time were the EUCAARI project (2008–2009; Kulmala
et al., 2009, 2011) and HUMPPA-COPEC (2010; Williams et al.,
2011; Corrigan et al., 2013). The sets of data used along with their
time frames are shown in Table 1. Data availability by year and month is
presented in Table 2.</p>
</sec>
</sec>
<sec id="Ch1.S2.SS2">
  <title>Instrumentation, data processing and preparation</title>
<sec id="Ch1.S2.SS2.SSS1">
  <title>The aerosol mass spectrometer (AMS) instrument and basic data
processing</title>
      <p id="d1e888">The mass spectrometric data for this study were acquired with a
Time-of-Flight Aerosol Mass Spectrometer (ToF-AMS), developed by Aerodyne
Research Inc. (Billerica, MA, US). AMS instruments in general have been
described by Canagaratna et al. (2007), and the compact ToF analyser version
(CToF) used in this study by Drewnick et al. (2005). Additional, more
specific details related to the specific instrument we used are available in
our previous study (Äijälä et al., 2017).</p>
      <p id="d1e891">In brief, the AMS instrument sucks sample aerosol from atmospheric pressure
to vacuum conditions through an inlet system consisting of a critical
orifice and a particle concentrating aerodynamic lens (Liu et al., 2007).
The sample aerosol beam is directed at a vaporiser operated at 600 <inline-formula><mml:math id="M17" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C, whereby flash vaporisation of non-refractory aerosol components
occurs. The resulting vapour is ionised using 70 eV electron impact
ionisation – a well-characterised hard ionisation technique, resulting in
rather universal and predictable but highly fragmenting ionisation. Finally,
the ions are led to an orthogonal extraction reflectron time-of-flight mass
analyser, where the ions' mass-to-charge (<inline-formula><mml:math id="M18" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula>) ratios are measured.</p>
      <p id="d1e915">The per-amu (atomic mass unit) analyser signal is subsequently quantified
based on instrument response calibrations and corrections (among others the
correction for relative ionisation efficiency between the species, RIE;
Allan et al., 2004; Supplement Sect. S4). Individual,
unit-mass-resolution amu signals are then chemically speciated, based on
chemical information on fragmentation and air composition (see Allan et al.,
2003b, for details). Additional, specific minor modifications to our
instrument have been discussed in our previous work (Äijälä et
al., 2017).</p>
</sec>
<sec id="Ch1.S2.SS2.SSS2">
  <title>Data preparation and down-weighting</title>
      <p id="d1e924">After basic processing, the data were further prepared, to serve as input for
factorisation (described in following Sect. 2.3). The organic and
inorganic data and related uncertainties were extracted, and down-weighting
of signals performed. The procedure for extraction and preparation of AMS
organic signal and related error matrices has been described by Allan et al. (2003b) and Ulbrich et al. (2009).</p>
      <p id="d1e927">In short, measurement points or variables with missing data were omitted and
error matrices calculated, based on a function accounting for both counting-statistics-induced uncertainty as well as background noise from the detector
and electronics. The signals were then down-weighted by multiplying the
error-matrix-conveyed uncertainty values for low signal-to-noise ratio (SNR)
variables with a scalar: “weak” variables (SNR <inline-formula><mml:math id="M19" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 3) were
down-weighted by a factor of 2 and “bad” variables (SNR <inline-formula><mml:math id="M20" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 1) by
10. The procedure for inorganics (<inline-formula><mml:math id="M21" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M22" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M23" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, Chl, i.e.
sulfates, nitrates, ammonia and chloride species) was similar to that used
for the organics (“org”), including for the down-weighting of signals
derived from fragmentation calculations. Analogous to the basic procedure of
down-weighting “duplicate information” organic signals, e.g. those derived
from <inline-formula><mml:math id="M24" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 44 Th (mainly <inline-formula><mml:math id="M25" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>), similarly derived inorganic signal
weights were normalised so that their weight of the original plus
“duplicate” signals equalled that of the original signal. Finally, the
matrices for all the ion species (org, <inline-formula><mml:math id="M26" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M27" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M28" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, Chl, in
nitrate equivalent mass) were combined to form the final input matrices for
factorisation, while retaining speciation information in the ion indexing.</p>
</sec>
</sec>
<sec id="Ch1.S2.SS3">
  <title>Statistical methods and algorithms</title>
<sec id="Ch1.S2.SS3.SSS1">
  <title>Positive matrix factorisation</title>
      <?pagebreak page3648?><p id="d1e1048">For factorisation, we used the PMF model developed by Pentti Paatero and
colleagues (Paatero, 1997, 1999; Paatero and Tapper, 1994) and widely used
for analysis of AMS data since 2007 (Lanz et al., 2007b; Zhang et al., 2011).
In brief, PMF is a statistical model, typically resolving a bilinear linear
combination of factor profiles (<inline-formula><mml:math id="M29" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>) and time series (<inline-formula><mml:math id="M30" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>)
best describing the measured data matrix (<inline-formula><mml:math id="M31" display="inline"><mml:mi mathvariant="bold">X</mml:mi></mml:math></inline-formula>; Eq. 1). The residual
matrix <inline-formula><mml:math id="M32" display="inline"><mml:mi mathvariant="bold">E</mml:mi></mml:math></inline-formula> then denotes the portion of data left unexplained by the
model (i.e. residual). The PMF model is thus formulated:
              <disp-formula id="Ch1.E1" content-type="numbered"><mml:math id="M33" display="block"><mml:mrow><mml:msub><mml:mi mathvariant="bold">X</mml:mi><mml:mrow><mml:mfenced close=")" open="("><mml:mrow><mml:mi>t</mml:mi><mml:mo>×</mml:mo><mml:mi>v</mml:mi></mml:mrow></mml:mfenced></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi mathvariant="bold">G</mml:mi><mml:mrow><mml:mfenced open="(" close=")"><mml:mrow><mml:mi>t</mml:mi><mml:mo>×</mml:mo><mml:mi>f</mml:mi></mml:mrow></mml:mfenced></mml:mrow></mml:msub><mml:mo>×</mml:mo><mml:msub><mml:mi mathvariant="bold">F</mml:mi><mml:mrow><mml:mfenced close=")" open="("><mml:mrow><mml:mi>f</mml:mi><mml:mo>×</mml:mo><mml:mi>v</mml:mi></mml:mrow></mml:mfenced></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi mathvariant="bold">E</mml:mi><mml:mrow><mml:mfenced open="(" close=")"><mml:mrow><mml:mi>t</mml:mi><mml:mo>×</mml:mo><mml:mi>v</mml:mi></mml:mrow></mml:mfenced></mml:mrow></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>
            The brackets indicate matrix dimensions, with <inline-formula><mml:math id="M34" display="inline"><mml:mi>v</mml:mi></mml:math></inline-formula> denoting number of variables,
<inline-formula><mml:math id="M35" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula> the number of time points and <inline-formula><mml:math id="M36" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula> the number of factors. As shown in Eq. (1), the model can be solved for any <inline-formula><mml:math id="M37" display="inline"><mml:mi>f</mml:mi></mml:math></inline-formula> (<inline-formula><mml:math id="M38" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mi>v</mml:mi></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M39" display="inline"><mml:mi>t</mml:mi></mml:math></inline-formula>), requiring it to be
selected by the analyst.</p>
      <p id="d1e1187">The main features setting PMF apart from other similar factorisation models,
and making it particularly suitable for atmospheric aerosol models, are on
the one hand the limitation of factor profiles and time series to positive
values, hence drastically reducing the amount of rotational ambiguity, and on
the other hand the improved error model where the quantity to minimise is the
weighted (typically the measurement uncertainty) residual, resulting in
higher weight for the variables with better SNR. In PMF, the minimum weighted
residual is solved using one of the related algorithms, i.e. PMF2 or
Multilinear Engine 2 (ME-2; Paatero, 1999). Of the two algorithms, ME-2 can
take in additional equations defined by the user, i.e. constraints the
solutions need to adhere to. In this study, when ME-2 constraints were
applied to the factor profiles, we set upper and lower bounds for the allowed
profile solutions. The bounds were based on variability estimates obtained
from earlier analysis, as explained later, in Sect. 2.5. Variability estimate
of the final model is available in the Supplement (Fig. S13). For running the
PMF and ME-2 algorithms, we used the Igor Pro (Wavemetrics Inc.) based SoFi
(v. 4.8) user interface developed by Francesco Canonaco and co-workers at
Paul Scherrer Institute (PSI). The interface allows input of the
pre-processed data and user-selected parameters, and calls on the solver
algorithms (PMF2 or ME-2, depending on assignment) to return a solution to be
displayed and analysed in SoFi (Canonaco et al., 2013).</p>
      <p id="d1e1190">When PMF is used as a standalone method for source attribution, the
selection of solution needs to be carefully validated. Sensitivities towards
a different number of factors, rotations and initialisation seeds are
meticulously analysed, and correlations with auxiliary data are computed. A case
is then made for why the selection is the best possible. Contrarily, in our
analysis approach, we <italic>do not</italic> claim to arrive at optimum solutions for <italic>individual</italic> PMF–ME-2
runs. Instead, we rely on a multitude of data de-convolution runs to uncover
the main structures in the ensemble of all data sets, and use statistical
classification methods to evaluate the general outlook and commonalities
between PMF–ME-2 factors at each analysis phase. As discussed in Sect. 2.5, this trade-off instead enables us to concentrate on best modelling the
entirety <italic>of all data sets</italic>.</p>
</sec>
<sec id="Ch1.S2.SS3.SSS2">
  <title>Relaxed chemical mass balance model</title>
      <p id="d1e1208">To harmonise the description of aerosol components, we constructed a
constrained receptor model, where all the profile components were
constrained. For this purpose we applied a ME-2-based chemical mass balance
(CMB) type of model. CMB models are typically used as receptor models for
cases where source profiles are known, and only the mass loading information
needs resolving (Friedlander, 1973; Gordon, 1988; Hopke, 1991, 2016; Miller et
al., 1972). In such mass-conservation-based models, the observed
loadings are<?pagebreak page3649?> modelled as a sum of multiple individual sources. Although CMB
is often presented mathematically as the sum of loadings (Supplement; Sect. S1, Eq. S1), it can also be thought
of as a special case of the bi-linear model described in Eq. (1). Only
now the profile matrix (<inline-formula><mml:math id="M40" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>) is assumed fixed, simplifying the problem to
resolving the loading matrix (<inline-formula><mml:math id="M41" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>) which minimises the residual (<inline-formula><mml:math id="M42" display="inline"><mml:mi mathvariant="bold">E</mml:mi></mml:math></inline-formula>). CMB can be
run using the SoFi interface, using the same ME-2 solver as for PMF and ME-2
applications (Canonaco et al., 2013).</p>
      <p id="d1e1232">In this work, we use a relaxed CMB-like bilinear model (henceforth
abbreviated as r-CMB), where all the source profiles are constrained but
allowed to vary within narrow limits (derived from variability estimates;
see Sect. 2.5; Supplement Fig. S13). In strict technical terms this approach
could be labelled “an extremely constrained ME-2 model”, but we choose to
use the term “relaxed CMB” to differentiate between the typical use of
ME-2 or constraining only part of the profiles, which allows the model
considerably more freedom. We regard our use of the model as much closer to
the idea of constraining all profiles than (semi-)exploratory factorisation
typical for ME-2. The naming also serves to better highlight the conceptual
differences between models in the different analysis phases.</p>
      <p id="d1e1235">Generally, the biggest problems of the CMB models relate to the selection of
source profiles, typically from spectral libraries, and handling of their
uncertainty. In our use, the anchor spectra as well as the limits for their
allowed variabilities are experimentally derived from data, alleviating some
of these typical concerns.</p>
</sec>
<sec id="Ch1.S2.SS3.SSS3">
  <?xmltex \opttitle{$k$-means clustering}?><title><inline-formula><mml:math id="M43" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means clustering</title>
      <p id="d1e1251">For spectra classification, we selected the <inline-formula><mml:math id="M44" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means algorithm, specifically
because in our previous tests it was successful in classifying similar
spectral data. The earlier tests additionally yielded useful information
on the selection of the dissimilarity metric, as well as algorithm initialisation
types and data weighting (Äijälä et al., 2017). The <inline-formula><mml:math id="M45" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means algorithm (e.g.
Ball and Hall, 1965; MacQueen, 1967; Steinhaus, 1956; Jain, 2010) is a rather
simple, iterative algorithm that partitions a group of objects to a
predesignated number of groups or “clusters” based on their relative
distances (i.e. dissimilarities). For each iteration, the algorithm assigns
all objects to their closest centroids, which are then re-calculated from the
mean variable values of the objects in the updated cluster. The aim is to
minimise the within-cluster sum of distance (variance) (<inline-formula><mml:math id="M46" display="inline"><mml:mi>J</mml:mi></mml:math></inline-formula>) between the
objects' (<inline-formula><mml:math id="M47" display="inline"><mml:mrow><mml:msub><mml:mi>C</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) locations (<inline-formula><mml:math id="M48" display="inline"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>) and the cluster centroid <inline-formula><mml:math id="M49" display="inline"><mml:mrow><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>
they are assigned to (Eq. 2):
              <disp-formula id="Ch1.E2" content-type="numbered"><mml:math id="M50" display="block"><mml:mrow><mml:mi>J</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>C</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:munder><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>x</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>C</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:mrow></mml:munder><mml:msup><mml:mfenced open="∥" close="∥"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi mathvariant="italic">μ</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>
            The <inline-formula><mml:math id="M51" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means algorithm iteratively converges on (any) minimum of total <inline-formula><mml:math id="M52" display="inline"><mml:mi>J</mml:mi></mml:math></inline-formula>
(<inline-formula><mml:math id="M53" display="inline"><mml:mi>C</mml:mi></mml:math></inline-formula>) obtained by summing over all objects <inline-formula><mml:math id="M54" display="inline"><mml:mrow><mml:msub><mml:mi>C</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. To increase chances of
finding a global minimum, repetitions using different initialisations are
used. Specifically, we used the improved stepwise initialisation
“kmeans<inline-formula><mml:math id="M55" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mo>+</mml:mo></mml:mrow></mml:math></inline-formula>” (Arthur and Vassilvitskii, 2007; available in MATLAB v. 2017a
for example, Math Works Inc., Natick, MA, USA).</p>
</sec>
<sec id="Ch1.S2.SS3.SSS4">
  <title>Spectral similarity and mass scaling</title>
      <p id="d1e1407">Based on our earlier metric comparison (Äijälä et al., 2017), we
used (Pearson) correlation as a metric for spectral dissimilarity (or
“distance”, <inline-formula><mml:math id="M56" display="inline"><mml:mi>d</mml:mi></mml:math></inline-formula>; Fortier and Solomon, 1966; Mcquitty, 1966):
              <disp-formula id="Ch1.E3" content-type="numbered"><mml:math id="M57" display="block"><mml:mrow><mml:mi>d</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:mi mathvariant="bold-italic">u</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="bold-italic">v</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">u</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>u</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:mrow></mml:mfenced><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">v</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>v</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:msqrt><mml:mrow><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">u</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>u</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:mrow></mml:mfenced></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:msqrt><mml:msqrt><mml:mrow><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">v</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>v</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:mrow></mml:mfenced></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
            where <inline-formula><mml:math id="M58" display="inline"><mml:mi mathvariant="bold-italic">u</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M59" display="inline"><mml:mi mathvariant="bold-italic">v</mml:mi></mml:math></inline-formula> are the spectra in vector form, with <inline-formula><mml:math id="M60" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula>
variables as vector components, and <inline-formula><mml:math id="M61" display="inline"><mml:mover accent="true"><mml:mi>u</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:math></inline-formula> and <inline-formula><mml:math id="M62" display="inline"><mml:mover accent="true"><mml:mi>v</mml:mi><mml:mo mathvariant="normal">‾</mml:mo></mml:mover></mml:math></inline-formula> are the
arithmetic mean values of <inline-formula><mml:math id="M63" display="inline"><mml:mi mathvariant="bold-italic">u</mml:mi></mml:math></inline-formula> and <inline-formula><mml:math id="M64" display="inline"><mml:mi mathvariant="bold-italic">v</mml:mi></mml:math></inline-formula>.</p>
      <p id="d1e1612">In clustering mass spectra, data weighting is often applied. Based on
previous tests (Äijälä et al., 2017), we applied mass scaling of
variables, advocated by Stein and Scott and others (Stein and Scott, 1994;
Kim et al., 2012; Horai et al., 2010), giving additional emphasis to higher
mass signals. This common practice is based on the idea that higher mass
fragment ions are more indicative of their parent ions, and thus the
original characteristic composition, while smaller fragments can be produced
from a wider variety of molecular fragmentation events. In mass scaling the
weighted variables (<inline-formula><mml:math id="M65" display="inline"><mml:mover accent="true"><mml:mi>x</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover></mml:math></inline-formula>) are calculated by multiplying the original
variables (<inline-formula><mml:math id="M66" display="inline"><mml:mi>x</mml:mi></mml:math></inline-formula>) by mass-to-charge-specific weights (<inline-formula><mml:math id="M67" display="inline"><mml:mi>w</mml:mi></mml:math></inline-formula>), as presented in Eq. (4).
              <disp-formula id="Ch1.E4" content-type="numbered"><mml:math id="M68" display="block"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>x</mml:mi><mml:mo mathvariant="normal" stretchy="false">^</mml:mo></mml:mover><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:msub><mml:mo>×</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:msub><mml:mo>;</mml:mo><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mspace width="0.25em" linebreak="nobreak"/><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msup><mml:mfenced open="(" close=")"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:mfenced><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:msub></mml:mrow></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
            where the scaling factor <inline-formula><mml:math id="M69" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> was optimised for each classification
separately (Supplement; Sect. S2).</p>
</sec>
<sec id="Ch1.S2.SS3.SSS5">
  <title>Silhouette metric and post-weighting</title>
      <?pagebreak page3650?><p id="d1e1735">The optimisation of mass scaling was based on the silhouette metric (later also
abbreviated as “silh”; Rousseeuw, 1987), ranging between <inline-formula><mml:math id="M70" display="inline"><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> to 1 and
providing a straightforward, quantitative way to evaluate performance of the
classification algorithm. The object-specific silhouette value <inline-formula><mml:math id="M71" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>,
defined as
              <disp-formula id="Ch1.E5" content-type="numbered"><mml:math id="M72" display="block"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfenced open="{" close=""><mml:mtable class="array" columnalign="left left"><mml:mtr><mml:mtd><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>;</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi mathvariant="normal">for</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mspace width="0.25em" linebreak="nobreak"/><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&lt;</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>;</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi mathvariant="normal">for</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mspace linebreak="nobreak" width="0.25em"/><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mi>b</mml:mi><mml:mfenced open="(" close=")"><mml:mi>i</mml:mi></mml:mfenced></mml:mrow><mml:mrow><mml:mi>a</mml:mi><mml:mfenced open="(" close=")"><mml:mi>i</mml:mi></mml:mfenced></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>;</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi mathvariant="normal">for</mml:mi><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mspace linebreak="nobreak" width="0.25em"/><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&gt;</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:math></disp-formula>
            where <inline-formula><mml:math id="M73" display="inline"><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> corresponds to the mean distance to other objects in the same
cluster, and <inline-formula><mml:math id="M74" display="inline"><mml:mrow><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> similarly to the mean distance to objects in the
nearest neighbouring cluster. A silhouette value close to unity indicates
the object is well clustered, while a value close to zero indicates the
classification is uncertain, and the point is likely situated in-between two
possible centroids. A negative cluster value is indicatory of possible
misclassification. Silhouette values can be calculated for any single
cluster as the arithmetic mean of the cluster members' silhouettes, or
similarly as a mean over all objects, to evaluate the quality of the
clustering solution as a whole.</p>
      <p id="d1e1905">In order to mitigate the <inline-formula><mml:math id="M75" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means algorithm's known sensitivity to outliers,
and to improve handling of between-cluster samples, we applied a simple
post-processing to all cluster centroids and variability calculations: the
centroid spectra and variabilities were calculated as <italic>weighted</italic> averages (<inline-formula><mml:math id="M76" display="inline"><mml:mover accent="true"><mml:mi mathvariant="italic">μ</mml:mi><mml:mo mathvariant="normal" stretchy="false">^</mml:mo></mml:mover></mml:math></inline-formula>), and <italic>weighted</italic> standard deviations (<inline-formula><mml:math id="M77" display="inline"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi mathvariant="italic">σ</mml:mi><mml:mo mathvariant="normal" stretchy="false">^</mml:mo></mml:mover><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>; Eq. 6) respectively,
instead of the normal unweighted values (similar to Äijälä et
al., 2017). As weights, we used the object specific silhouette values
<inline-formula><mml:math id="M78" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula> (Eq. 5):

                  <disp-formula specific-use="align" content-type="numbered"><mml:math id="M79" display="block"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd><mml:mstyle class="stylechange" displaystyle="true"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle displaystyle="true" class="stylechange"/><mml:mover accent="true"><mml:mi mathvariant="italic">μ</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:msubsup><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>v</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>;</mml:mo><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mspace width="0.25em" linebreak="nobreak"/><mml:msup><mml:mover accent="true"><mml:mi mathvariant="italic">σ</mml:mi><mml:mo stretchy="false" mathvariant="normal">^</mml:mo></mml:mover><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:msubsup><mml:mi>s</mml:mi><mml:msup><mml:mfenced close=")" open="("><mml:mrow><mml:mi>v</mml:mi><mml:mo>-</mml:mo><mml:mi mathvariant="italic">μ</mml:mi></mml:mrow></mml:mfenced><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:munderover><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>;</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mlabeledtr id="Ch1.E6"><mml:mtd/><mml:mtd><mml:mstyle class="stylechange" displaystyle="true"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mo movablelimits="false">max⁡</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>s</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mn mathvariant="normal">0</mml:mn><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr></mml:mtable></mml:math></disp-formula>

              where <inline-formula><mml:math id="M80" display="inline"><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are the cluster member objects (spectra) This procedure
down-weights likely misclassified objects (silhouette <inline-formula><mml:math id="M81" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">0</mml:mn></mml:mrow></mml:math></inline-formula>) to zero,
and penalises the more uncertain or questionable assignations (low
silhouette) compared to the decidedly well-clustered objects (silhouette
close to unity). Singleton clusters were omitted from this calculation, and
their variability was thus left undefined.</p>
</sec>
</sec>
<sec id="Ch1.S2.SS4">
  <title>Standard approximations for aerosol inorganic speciation and
organonitrate</title>
<sec id="Ch1.S2.SS4.SSS1">
  <title>Ion balance model for inorganics</title>
      <p id="d1e2152">Aerosol inorganic chemical speciation is better understood than the organic
speciation, due to much lower diversity of the chemical compounds involved.
A variety of aerosol inorganic equilibrium models exist and are typically
used as modules in atmospheric meteorological and air quality models.
However, performing thermodynamic equilibrium calculations is
computationally demanding (e.g. Fountoukis and Nenes, 2007) and requires a
good deal of auxiliary data on thermodynamic conditions and chemical
activities. Due to the complexity of the models and increased data needs,
simpler approximations are often used in connection with AMS inorganic
speciation. In the following ion-balance-scheme description, we denote the
respective AMS ion species molar concentrations in square brackets (e.g.
[<inline-formula><mml:math id="M82" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>], [<inline-formula><mml:math id="M83" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn><mml:mo>-</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>], [<inline-formula><mml:math id="M84" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>-</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula>]).</p>
      <p id="d1e2197">A typical salt formation approximation used for AMS results is the Hong et
al. (2017) ion pairing scheme, used in aerosol volatility and light
scattering models, for example (Hong et al., 2017; Zieger et al., 2015). The
Hong et al. (2017) scheme is based on similar approximation of Gysel et
al. (2007), which in turn is a simplification of the more extensive model by
Reilly and Wood (1969). We modified the Hong et al. (2017) scheme to
additionally allow organonitrate (<inline-formula><mml:math id="M85" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>) and speciate any leftover
[<inline-formula><mml:math id="M86" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] as its own class (“excess <inline-formula><mml:math id="M87" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>”). The full
scheme is available in the Supplement (Sect. S3), and a schematic description
is presented in Fig. 1.</p>
      <p id="d1e2237">Briefly, in the scheme we apply, <inline-formula><mml:math id="M88" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> is first combined with
<inline-formula><mml:math id="M89" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>-</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> to form ammonium bisulfate and/or ammonium sulfate
depending on the relative concentrations of [<inline-formula><mml:math id="M90" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] and
[<inline-formula><mml:math id="M91" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>-</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula>]. Any leftover [<inline-formula><mml:math id="M92" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] then combines with
[<inline-formula><mml:math id="M93" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn><mml:mo>-</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>], until all [<inline-formula><mml:math id="M94" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>-</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula>] and [<inline-formula><mml:math id="M95" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn><mml:mo>-</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>]
is fully consumed in forming <inline-formula><mml:math id="M96" display="inline"><mml:mrow class="chem"><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and
<inline-formula><mml:math id="M97" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula><inline-formula><mml:math id="M98" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. After this point, any leftover
[<inline-formula><mml:math id="M99" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] is considered “excess” and assigned to a separate
class. For comparability with other models, any nitrate not in
<inline-formula><mml:math id="M100" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula><inline-formula><mml:math id="M101" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> is labelled organic. Despite the label, we note
this class not only encompasses organonitrates, but also any <inline-formula><mml:math id="M102" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">NO</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>
fragment signal from amines and N-containing organics and
may even contain influences of other inorganic nitrate species, such as
<inline-formula><mml:math id="M103" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">KNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, which are not considered separately in this simple model.
Finally, since chloride loadings at the measurement site are generally
negligible, neutralisation of hydrochloric acid (<inline-formula><mml:math id="M104" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mi mathvariant="normal">O</mml:mi></mml:mrow></mml:math></inline-formula> : HCl) was
not included to keep this scheme rather simple. We note that ion balance
schemes depending on relative ion abundances, such as the one described here,
can be sensitive to measurement uncertainties (e.g. errors in RIE values) of
these ratios. The topic is further discussed in the Supplement (Sect. S4)</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F1"><label>Figure 1</label><caption><p id="d1e2470">Schematic representation of the inorganic apportionment scheme. The
scheme is divided into three cases according to the ratio of
[<inline-formula><mml:math id="M105" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] to [<inline-formula><mml:math id="M106" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>-</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula>]. [<inline-formula><mml:math id="M107" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] first
combines with [<inline-formula><mml:math id="M108" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>] to form <inline-formula><mml:math id="M109" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">HSO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (Case 1), then
further to <inline-formula><mml:math id="M110" display="inline"><mml:mrow class="chem"><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (Case 2). In these cases, any nitrate
observed is considered organic. In Case 3 leftover [<inline-formula><mml:math id="M111" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] then
associates with [<inline-formula><mml:math id="M112" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn><mml:mo>-</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] until all the inorganic anions are neutralised. Any leftover
[<inline-formula><mml:math id="M113" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] is labelled as “excess <inline-formula><mml:math id="M114" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>”. A full
description of the scheme is given in the Supplement (Sect. S3).</p></caption>
            <?xmltex \igopts{width=241.848425pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f01.png"/>

          </fig>

<?xmltex \hack{\newpage}?>
</sec>
<?pagebreak page3651?><sec id="Ch1.S2.SS4.SSS2">
  <title>Kiendler-Scharr parameterisation for organonitrate</title>
      <p id="d1e2632">The organic nitrate estimate in the above model is very sensitive to calibration
parameters (see Supplement Sect. S4). Therefore, in addition to the ion-balance-based scheme above, we additionally calculated a particulate organonitrate
mass estimate (<inline-formula><mml:math id="M115" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mrow><mml:mn mathvariant="normal">3</mml:mn><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mi mathvariant="normal">mass</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>), based on the nitrate fragmentation
ratio-based parameterisation of Kiendler-Scharr et al. (2016; Farmer et al., 2010):

                  <disp-formula specific-use="align" content-type="numbered"><mml:math id="M116" display="block"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd><mml:mstyle class="stylechange" displaystyle="true"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:msub><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow><mml:mi mathvariant="normal">mass</mml:mi></mml:msub><mml:mo>=</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mlabeledtr id="Ch1.E7"><mml:mtd/><mml:mtd><mml:mstyle displaystyle="true" class="stylechange"/></mml:mtd><mml:mtd><mml:mrow><mml:mstyle class="stylechange" displaystyle="true"/><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mspace width="0.25em" linebreak="nobreak"/><mml:msub><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow><mml:mi mathvariant="normal">total</mml:mi></mml:msub><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mfenced open="(" close=")"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>+</mml:mo><mml:msub><mml:mi>R</mml:mi><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mi>x</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">measured</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">calib</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mfenced close=")" open="("><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>+</mml:mo><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">measured</mml:mi></mml:msub></mml:mrow></mml:mfenced><mml:mi>x</mml:mi><mml:mfenced open="(" close=")"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">calib</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:mrow></mml:mfrac></mml:mstyle><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mlabeledtr></mml:mtable></mml:math></disp-formula>

              where <inline-formula><mml:math id="M117" display="inline"><mml:mi>R</mml:mi></mml:math></inline-formula> refers to the ratio of nitrate signals at 46 and 30 Th, i.e. <inline-formula><mml:math id="M118" display="inline"><mml:mrow><mml:mi>R</mml:mi><mml:mo>=</mml:mo><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M119" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 46 Th) : <inline-formula><mml:math id="M120" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M121" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 30 Th), for organonitrate
(“<inline-formula><mml:math id="M122" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>”), <inline-formula><mml:math id="M123" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula><inline-formula><mml:math id="M124" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> calibration (“calib”) and ambient
measurement (“measured”), respectively. For the parameterisation, we
applied an ion ratio <inline-formula><mml:math id="M125" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">calib</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.42</mml:mn></mml:mrow></mml:math></inline-formula>, taken as the average of mass-spectrum-based AN calibrations (Supplement Sect. S6). An <inline-formula><mml:math id="M126" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> value of 0.1 was
used, based on the estimate by Kiendler-Scharr and co-workers for their
observations on organonitrate spectral properties (Kiendler-Scharr et al.,
2016).</p>
</sec>
</sec>
<sec id="Ch1.S2.SS5">
  <title>Constructing a data-driven r-CMB receptor model</title>
      <p id="d1e2888">As stated in the Introduction, one of the aims of our work was to derive a
robust, harmonised receptor model for the measurement site via explorative
analysis. Considering the large amount of campaigns during different
seasons, resulting in changing aerosol source contributions and mass
spectral profiles, factorisation needed to be performed on a per-campaign
(data set) basis. However, instead of performing traditional PMF complete
with correlation analysis, source validation and the various sensitivity
analyses separately, which would be an arduous task even for a single
measurement set, we used the large amount of data sets to our advantage.
Instead of optimising individual factorisations, we constructed an r-CMB
model applicable to all data sets. A similar task of constructing a
semi-exploratory synthesis aerosol model, albeit one applying a different
methodology, was undertaken and reported by Sofowote et al. (2015).</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F2" specific-use="star"><label>Figure 2</label><caption><p id="d1e2893">A flowchart illustrating the analysis using combined methodology.
After initial data collection and preparation, statistical analysis is
performed in three phases (P-I to P-III). Each phase limits the freedom given
to factorisation from completely free (PMF) to nearly fully constrained
(r-CMB). Finally, we evaluate and interpret the r-CMB model from an aerosol
chemical perspective.</p></caption>
          <?xmltex \igopts{width=384.112205pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f02.png"/>

        </fig>

      <p id="d1e2902">To derive the anchors and constraints for a synthesis r-CMB model, we
analysed the data in three phases (P-I to P-III; Fig. 2), each consisting
of factorisation, classification and silhouette-based post-weighting of
anchor spectra and their allowed variabilities. The allowed variabilities
were constrained by setting upper and lower bounds (the estimated
variability ranges from the previous phase) for factor profiles. In Phases I
and II, a fixed number of 10 factors were resolved. This amount of factors
was semi-arbitrarily chosen, and in our case likely to be somewhat above the
optimal amount for most data sets, leading to over-resolved factor
solutions. However, unlike in traditional PMF analysis, we can use
additional statistical diagnostics and post-processing options available to
deal with potential fallout of unrealistic factor splitting (i.e.
classification for identifying outliers and post-processing down-weighting
or nullifying their influence). Sensitivity to initialisation seed was
examined by performing all runs using 10 initialisation seeds, and generally
selecting the solution with lowest normalised residual. In rare cases of a
physically unrealistic solutions such as the one with the lowest residual (e.g. only
<inline-formula><mml:math id="M127" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> species in a factor), a higher residual solution was chosen
instead. We conclude the solutions were generally insensitive to seed
selection, especially for the factors with non-negligible mass contribution.</p>
<sec id="Ch1.S2.SS5.SSS1">
  <title>Phase I: anthropogenic aerosols</title>
      <p id="d1e2921">In phase I (P-I), we performed unconstrained factorisation for all the eight data
sets. With 10 factors this resulted in a total of 80 factors of mass spectra. We
then determined the dominant spectra classes using <inline-formula><mml:math id="M128" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means clustering. To
that purpose, we applied optimised mass scaling for improved data structure,
and used silhouette diagnostics to evaluate the optimal number of clusters.
We identified the known, common anthropogenic aerosol classes from the
silhouette-weighted cluster centroids. This is also an approach advocated by
Crippa et al. (2014) in their similar work on a synthesis analysis of
several data sets.</p>
      <p id="d1e2931">For a cluster centroid to qualify as an anchor for further phases of our
analysis, we applied the following two criteria: (1) the spectra forming the
cluster were present in multiple (<inline-formula><mml:math id="M129" display="inline"><mml:mrow><mml:mo>≥</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:math></inline-formula>) data sets, and (2) the spectra
were interpretable chemically and had adequate support from previous
studies in the form of literature and/or calibrations. We note that defining
what constitutes ”interpretable” or “adequate support” is inevitably
an analyst (subjective) decision, so we endeavour to make our reasoning
transparent in the respective discussion sections. Adhering to criterion (1)
also means that factors showing up only for one to two campaigns, due to special
conditions (emission, meteorology etc.), are omitted from the final r-CMB
model. We will briefly cover some of the more interesting “outlier
observations” in Sect. 3.4. At the end of phase I, a number of
constrained anchor spectra and within-cluster-variabilities were obtained.
In this case, these corresponded to four anthropogenic classes, which will
be discussed in more detail in the results section.</p>
</sec>
<sec id="Ch1.S2.SS5.SSS2">
  <title>Phase II: biogenic, secondary organic aerosols</title>
      <p id="d1e2951">Using the anchors and within-cluster variabilities, we re-ran factorisation
as in P-I, except now partly constrained (ME-2; 4 of 10 factors constrained
using anchors from P-I). In phase II, we focused on analysing the remaining
free factors, likely corresponding to the biogenic and assumedly more
variable factors (Canonaco et al., 2015; Crippa et al., 2014). The procedure
for classification and the selection criteria for the<?pagebreak page3652?> (assumedly) biogenic
SOA in this phase were the same as in phase I.</p>
      <p id="d1e2954">Due to the data-driven analysis approach, specifically the constrained
factors being selected from phase I, we do not expect major changes between
phase I and phase II (P-II) results. While arguably the methodology could be
further developed to constrain the r-CMB components directly from the phase I
result, phase II of our analysis currently serves several purposes: (1) it
should narrow down the solution space for improved description of the
various SOA types, by constraining the anthropogenic, assumedly primary
aerosols. (2) Compared to P-I, the allowed solutions are more similar for all
data sets in P-II, which reduces the scatter of the factorisation solutions.
This reduces the spectral variability (uncertainty) arising from the
analysis process itself, allowing us to iteratively converge on more
realistic limit values for the constraints. Ultimately, the limits should
reflect the actual, natural chemical variabilities within the aerosol types.
(3) Similarity of results between successive, un- or semi-constrained phases
allows evaluation of stability, reliability and repeatability of the method,
so that it is not e.g. overly sensitive to rotational ambiguity or
initialisation parameters of algorithms. This is important since the method
described here is new, and its robustness needs to be demonstrated, but less
so in potential later use.</p>
</sec>
<sec id="Ch1.S2.SS5.SSS3">
  <title>Phase III: final, constrained receptor model</title>
      <p id="d1e2963">In phase III (P-III), we constructed the r-CMB receptor model. In this phase, all
the factors were constrained using anchors and variabilities from the
previous phase result. The number of components in the final r-CMB model, in
our case 7, was equal to the total number of selected aerosol types in phase II. With these model constraints, we performed runs for each of the eight data
sets separately. Using the resulting <inline-formula><mml:math id="M130" display="inline"><mml:mrow><mml:mn mathvariant="normal">8</mml:mn><mml:mo>×</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> factor profiles, we
determined the likely range of variability for the aerosol types, and
calculated final, silhouette-weighted reference spectra for the components
by performing a final round of clustering.</p>
</sec>
</sec>
</sec>
<sec id="Ch1.S3">
  <title>Results and discussion</title>
      <p id="d1e2986">In Sect. 3.1, we briefly describe the results from analysis phases I to
III (P-I to P-III; corresponding to Sect. 3.1.1 to 3.1.3) but
concentrate more on the receptor model results and their interpretation
(Sect. 3.2). Finally we will compare our results with reference methods
(Sect. 3.3). Comparison results are available in the literature for organic
aerosol components (Sect. 3.3.1), and in Sect. 3.2 we will compare inorganic
speciation with the alternative inorganic attribution methods, described in
Methods (Sect. 2.4). Finally, we briefly describe some of the outlier
observations which contain potentially interesting chemical information
(Sect. 3.4).</p>
      <p id="d1e2989">When interpreting and identifying aerosol components, we evaluate spectral
similarity using the same similarity metric (mass scaled correlation) as for
the clustering (Eqs. 3 and 4). We thus report mass scaled squared
correlation coefficients (<inline-formula><mml:math id="M131" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula>) between reference spectra and our
corresponding final spectrum for the class (P-III silhouette-weighted
centroids; <inline-formula><mml:math id="M132" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.81</mml:mn></mml:mrow></mml:math></inline-formula>). For easier comparability, all ratios and
fractions of signals presented in the following sections are similarly
calculated from the corresponding final spectra (P-III).</p><?xmltex \hack{\newpage}?>
<?pagebreak page3653?><sec id="Ch1.S3.SS1">
  <title>Receptor model construction steps</title>
<sec id="Ch1.S3.SS1.SSS1">
  <title>Phase I: identification of anthropogenic aerosol components</title>
      <p id="d1e3031">In phase I, we performed unconstrained PMF runs using 10 factors for all 8 data sets separately. The resulting 80-factor spectra were subsequently
clustered. Maximal data structure (silhouette 0.56) was achieved at mass
scaling <inline-formula><mml:math id="M133" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2.12</mml:mn></mml:mrow></mml:math></inline-formula> for 17 clusters (for details on silhouette analysis,
see Supplement, Sect. S2). The eight clusters with largest
population for the phase I solution are shown in Fig. 3, and the rest in
Sect. 3.4, where outlier observations are further discussed. Generally,
the solutions agreed closely on the largest clusters, lending credibility to
the robustness of the approach. The solutions differed mainly regarding
outlier classification, which is of secondary importance for our r-CMB
model, since outliers are discarded from the model.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F3" specific-use="star"><label>Figure 3</label><caption><p id="d1e3051">The eight largest clusters for P-I classification of factorisation
results. Cluster centroids (coloured bars) and variabilities (error bars) are
silhouette-weighted averages and standard deviations for the cluster members.
The main anthropogenic aerosol types were identified as clusters no. 2
(“Ammonium sulfate”, AS), no. 4 (“Hydrocarbon-like organic aerosol”,
HOA), no. 5 (“Biomass burning organic aerosol”, BBOA) and no. 8 (“Ammonium
nitrate”, AN). Cluster number, silhouette and population (<inline-formula><mml:math id="M134" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula>) are shown in
panel titles.</p></caption>
            <?xmltex \igopts{width=497.923228pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f03.png"/>

          </fig>

      <p id="d1e3067">Unsurprisingly, the classification returns two large clusters of organic
aerosol resembling the ubiquitous low-volatile oxidised
organic aerosols (no. 1; LV-OOA) and semi-volatile oxidised organic aerosol
(SV-OOA; e.g. Aiken et al., 2007; Jimenez et al., 2009; Zhang et al., 2011).
Comparing to library spectra, the aerosol type dominated by <inline-formula><mml:math id="M135" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 44 Th
(<inline-formula><mml:math id="M136" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) (no. 1) best matches with LV-OOA and OOA-I (oxidised
organic aerosol, a historical label corresponding to LV-OOA; Aiken et al.,
2008; Zhang et al., 2011) spectra from Paris (<inline-formula><mml:math id="M137" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.97</mml:mn></mml:mrow></mml:math></inline-formula>;
Crippa et al., 2013), Zurich (0.96; Lanz et al., 2007a; Crippa et al., 2013)
and Borneo rainforest (0.99; Robinson et al., 2011) as well as the average
LV-OOA calculated from 15 Northern Hemisphere data sets (0.94; Ng et al.,
2010). Cluster no. 3 is characterised by a high <inline-formula><mml:math id="M138" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 43 Th signal
(<inline-formula><mml:math id="M139" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msup><mml:mi mathvariant="normal">O</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>; Aiken et al., 2008) and correlates with SV-OOA and
OOA-II (Aiken et al., 2008) spectra from Pasadena (0.74; Hersey et al.,
2011), Borneo (0.86; Robinson et al., 2011) and the 15-data-set average
(0.76; Ng et al., 2010) as well as the laboratory-generated SOA spectra
generated from typical pine forest emitted volatile organic compounds (e.g.
<inline-formula><mml:math id="M140" display="inline"><mml:mi mathvariant="italic">α</mml:mi></mml:math></inline-formula>-pinene, 0.81; <inline-formula><mml:math id="M141" display="inline"><mml:mi mathvariant="italic">α</mml:mi></mml:math></inline-formula>-terpinene, 0.83; terpinolene,
0.84; Bahreini et al., 2005). Abiding by the typical naming convention of
AMS-derived aerosol types, we label these species LV-OOA (cluster no. 1) and
SV-OOA (no. 3).</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F4" specific-use="star"><label>Figure 4</label><caption><p id="d1e3163">Final silhouette-weighted reference spectra (coloured bars) and
variabilities (error bars) for the r-CMB model components.</p></caption>
            <?xmltex \igopts{width=497.923228pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f04.png"/>

          </fig>

      <p id="d1e3172">The solution also contains a large cluster (no. 2) with spectra dominated by
ammonium and sulfate ion species. This is in agreement with ammonium
sulfate being a main component of ambient aerosols. Although it also contains
trace amounts of other species, we name the <inline-formula><mml:math id="M142" display="inline"><mml:mrow class="chem"><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>-dominated aerosol class (no. 2) ammonium sulfate (AS) for brevity.</p>
      <p id="d1e3198">The main nitrate-containing spectra are divided into two clusters (no. 6 and
no. 8). The divisive feature seems to be the ratio of <inline-formula><mml:math id="M143" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 46 to 30 Th signals
(i.e. <inline-formula><mml:math id="M144" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">measured</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> in Eq. 7), which is much higher in cluster type
no. 8 (<inline-formula><mml:math id="M145" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.44</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.11</mml:mn></mml:mrow></mml:math></inline-formula>) versus for no. 6 (<inline-formula><mml:math id="M146" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.08</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.07</mml:mn></mml:mrow></mml:math></inline-formula>; P-III; see
Supplement Sect. S5 for error estimate). We note once more that these
characteristic values for clusters are from the final model (P-III; Fig. 4), as outlined before. Based on the literature we interpret the split to
correspond to the division between nitrogen in the form of inorganic (ammonium)
nitrate (AN) and organic nitrogen, matching with previous AMS observations
(Hao et al., 2014; Farmer et al., 2010; Kiendler-Scharr et al., 2016). The
interpretation of cluster no. 8 as AN is additionally corroborated by its
similarity to spectra from pure ammonium nitrate calibration for the
instrument, available in the Supplement (Sect. S6). On average, the brute-force single-particle
(BFSP; Drewnick et al., 2015) AN calibrations
performed for the instrument yielded an <inline-formula><mml:math id="M147" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">calib</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> (Eq. 7) ratio of
<inline-formula><mml:math id="M148" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.49</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.05</mml:mn></mml:mrow></mml:math></inline-formula> (mean <inline-formula><mml:math id="M149" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> standard deviation), while an MS mode
calibration returned an <inline-formula><mml:math id="M150" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">calib</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> of 0.42. Similarly to naming of the AS
class, we use labels organic nitrogen (ON; cluster no. 6) and AN (cluster no. 8) for the nitrate-dominated aerosol types. The ON
cluster is further discussed in Sect. 3.3.2. The label ON was chosen to
differentiate between the (presumably) organic-nitrogen-dominated aerosol
class (ON), and the part of <inline-formula><mml:math id="M151" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> ion species deemed likely to be
organonitrate (<inline-formula><mml:math id="M152" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>).</p>
      <p id="d1e3312">A fraction of the organic signal observed at <inline-formula><mml:math id="M153" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 44 Th for inorganic salt
classes (AS and AN) may be explained by an <inline-formula><mml:math id="M154" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> artefact induced
by thermal decomposition of inorganic salts (Pieber et al., 2016). For
ammonium nitrate, the proportion of organic signal at <inline-formula><mml:math id="M155" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 44 Th to total nitrate
signal is 2.9 % (P-III). Pieber et al. (2016) estimate a contribution of
3.4 %, suggesting most of the organic signal observed in AN may arise
from this artefact. This proposition is further discussed in the Supplement
(Sect. S6).</p>
      <p id="d1e3352">Two of the clusters (no. 4 and no. 5) seem related to anthropogenic
(primary) organic aerosol types. Cluster no. 4 has a similar spectrum as the
hydrocarbon-like-organic aerosol (HOA) spectra from the AMS spectral
database (Ulbrich et al., 2009) and closely matches, among others, HOA
reported by Zhang et al. (2005) for Pittsburgh
(<inline-formula><mml:math id="M156" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.91</mml:mn></mml:mrow></mml:math></inline-formula>) and the average of 15 de-convolved HOA
spectra reported by Ng et al. (2010; <inline-formula><mml:math id="M157" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.89</mml:mn></mml:mrow></mml:math></inline-formula>). The
spectra also exhibits high similarity with traffic emission spectra of
diesel bus exhaust (0.86), lubricating oil (0.82) and fuel (0.75), reported
by Canagaratna et al. (2004).</p>
      <?pagebreak page3654?><p id="d1e3389">Cluster no. 5 features high signals for ions typical of biomass burning
organic aerosol (BBOA, e.g. Alfarra et al., 2007) and cooking organic
aerosol (COA, e.g. Mohr et al., 2012). The spectra features the marker
signals of levoglucosan (Cubison et al., 2011; Schneider et al., 2006) at
<inline-formula><mml:math id="M158" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 60 (<inline-formula><mml:math id="M159" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">O</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) and 73 Th (<inline-formula><mml:math id="M160" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">5</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">O</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>)
along with chloride ions (at <inline-formula><mml:math id="M161" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 35 and 36 Th) and a high fraction of signal
at <inline-formula><mml:math id="M162" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 55 Th (<inline-formula><mml:math id="M163" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msup><mml:mi mathvariant="normal">O</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>; Mohr et al., 2012), pointing to
cooking and/or biomass burning emissions. The highest similarities to library
spectra (de-convolved via PMF) are found with COA (Mohr et al., 2012, for
Barcelona, <inline-formula><mml:math id="M164" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.70</mml:mn></mml:mrow></mml:math></inline-formula>; Crippa et al., 2013 for Paris,
<inline-formula><mml:math id="M165" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.59</mml:mn></mml:mrow></mml:math></inline-formula>) and BBOA (e.g. 15-data-set average reported by Ng et
al., 2010, <inline-formula><mml:math id="M166" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.51</mml:mn></mml:mrow></mml:math></inline-formula>) and BBOA de-convolved by Crippa et
al. (2013, for Paris, <inline-formula><mml:math id="M167" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.50</mml:mn></mml:mrow></mml:math></inline-formula>). Similarity to SV-OOA library
samples are also moderately high (e.g. Ng et al., 2010, 15-data-set average,
<inline-formula><mml:math id="M168" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.59</mml:mn></mml:mrow></mml:math></inline-formula>).</p>
      <p id="d1e3582">The differentiation between HOA versus BBOA or COA can often be resolved even
from unit resolution spectra, using the <inline-formula><mml:math id="M169" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">55</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>-to-<inline-formula><mml:math id="M170" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> ratio (Mohr et
al., 2012), and the differences in mass spectral fingerprints higher up on
the <inline-formula><mml:math id="M171" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> axis (resolvable using mass scaling; Äijälä et al.,
2017). However, the distinction between COA and BBOA aerosol types is much
more delicate due to very high unit mass resolution spectral similarity for
higher <inline-formula><mml:math id="M172" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> variables, (e.g. <inline-formula><mml:math id="M173" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.79</mml:mn></mml:mrow></mml:math></inline-formula> for COA and BBOA
reported by Mohr et al., 2012). The main difference between the COA and BBOA
aerosol types is the absolute level signals from levoglocosan fragments, the
quantitative interpretation of which is difficult due to (1) levoglucosan
production being determined by combustion temperature (Shafizadeh, 1984),
(2) levoglucosan originating both from BBOA and COA (Mohr et al., 2012), and
(3) levoglucosan sinks being potentially considerable in the atmosphere
(Hoffmann et al., 2009), which affects transported aerosol in particular. Due
to the remote location of the measurement site and general prevalence of BBOA
over COA in urban aerosol loadings (e.g. Daellenbach et al., 2017) we
conclude that BBOA is more likely the dominant component for this aerosol
type, so we will use the class label “BBOA” for brevity. Due to high
spectral similarity, we find it extremely likely that any COA contribution
would be apportioned to this class, but without the benefit of
high-mass-resolution data, the convolution seems insolvable at this time.</p>
      <p id="d1e3648">Cluster 7 spectrum offers little in terms of unique spectral features, and it
appears as though it could be represented as a combination of the more distinct AS
(no. 2), LV-OOA (no. 1) and ON (no. 6) aerosol types. It is unclear whether this
class represents an actual aerosol chemical type, or whether it is due to
incomplete resolving of the aforementioned species in the PMF model. We note
that the organics part of AS, LV-OOA and ON are all highly oxidised, which may
imply similar levels of aging and thus similar origins for these species. Organic
spectral components are further analysed and discussed in Sect. 3.2.2.</p>
      <p id="d1e3651">Based on this interpretation and evaluation of criteria outlined in
Sect. 2.5, we decided to select the following as the main representative anthropogenic
aerosol types: ammonium sulfate (cluster no. 2, <inline-formula><mml:math id="M174" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula>,
silhouette <inline-formula><mml:math id="M175" display="inline"><mml:mrow><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.91</mml:mn></mml:mrow></mml:math></inline-formula>) ammonium nitrate (no. 8, <inline-formula><mml:math id="M176" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula>, silh <inline-formula><mml:math id="M177" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.48),
hydrocarbon-like organic aerosol (no. 2, <inline-formula><mml:math id="M178" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:math></inline-formula>, silh <inline-formula><mml:math id="M179" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.65) and
biomass burning organic aerosol (no. 5, <inline-formula><mml:math id="M180" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">6</mml:mn></mml:mrow></mml:math></inline-formula>, silh <inline-formula><mml:math id="M181" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.36). The
silhouette<?pagebreak page3655?> values can be taken to represent separation distance from
neighbouring aerosol types. For comparison, silhouette values for some of the
anthropogenic organic aerosol types are available in Äijälä et
al. (2017), but to our knowledge no precedent exists for mixed or inorganic
aerosols. Generally, the more “unique” the spectra of a group and the
higher the within-cluster cohesion, the higher the silhouette.</p>
</sec>
<sec id="Ch1.S3.SS1.SSS2">
  <title>Phase II: classification of biogenic secondary organic
aerosols</title>
      <p id="d1e3740">In the second phase of our analysis, ME-2 factorisations were run for 10
factors for all the data sets. We constrained 4 out of the 10 factors with
the anchors and variabilities for anthropogenic aerosol types, derived from
the previous phase (AS, AN, HOA, BBOA). The resulting 80-factor profiles were
again extracted and classified. The classification solutions featured
generally higher silhouette values than in the first phase, which is at least
partly explained by constrained spectra being forced to conform to their set
limits. The highest total silhouette (0.66) was obtained for 15 clusters (at
<inline-formula><mml:math id="M182" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">2.41</mml:mn></mml:mrow></mml:math></inline-formula>). Again, the inter-solution variability for the solutions
inspected was low for the main classes. The phase II solution is available
in the Supplement (Fig. S4). Overall, the solution very closely resembles the result
from phase I (Fig. 3).</p>
      <p id="d1e3758">The expected LV-OOA (no. 1; <inline-formula><mml:math id="M183" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">14</mml:mn></mml:mrow></mml:math></inline-formula>; silh 0.64) and SV-OOA (no. 3; <inline-formula><mml:math id="M184" display="inline"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">9</mml:mn></mml:mrow></mml:math></inline-formula>;
silh 0.44) aerosol types again rank among the most typical classifications.
Their moderate silhouettes reflect higher variability within these classes,
corresponding to results from earlier studies (e.g. Canonaco et al., 2015),
and/or closer proximity to neighbouring aerosol types, than for the AN, AS
or HOA types. The result may suggest seasonal or other data-set-specific
variability for SOA, which supports partitioning the data on a per-campaign
basis. In accordance with typical AMS organic aerosol classification
conventions laid out by Aiken et al. (2008) for example, we opt for two classes of
oxidised aerosols. We thus select clusters no. 1 and no. 3 (P-II) to
represent LV-OOA and SV-OOA (Aiken et al., 2008; Jimenez et al., 2009)
respectively.</p>
      <p id="d1e3785">For P-III of our analysis, we additionally fix the organic nitrogen class,
(ON, P-II cluster no. 8). Irrespective of the exact chemical composition and
label of this aerosol component, we assess that there is enough literature
support (among others Kiendler-Scharr et al., 2016; Farmer et al., 2010;
Drewnick et al., 2015; Murphy et al., 2007; Hao et al., 2014) for inclusion
of nitrogen-containing aerosol types other than AN to warrant the inclusion
of this class. In any case, the classification of nitrate signal at <inline-formula><mml:math id="M185" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 30 Th
to a distinct class seems statistically robust, as exhibited by its
emergence as a free factor in both P-I and P-II solutions.<?pagebreak page3656?> Due to the
importance of nitrogen-containing species in SOA composition and formation
(e.g. Kiendler-Scharr et al., 2016; Berkemeier et al., 2016) we find it an
important aerosol class to include, examine and further interpret. The mixed
cluster no. 7 also emerges for four data sets, but with notably low silhouette
(0.18), suggestive of low within-cluster cohesion. As we still lack a
distinct chemical interpretation for this class, beyond the hypothesis of
incomplete resolution of aged aerosol species in factorisation, we will not
include the mixed class (no. 7) in our final receptor model.</p>
</sec>
<sec id="Ch1.S3.SS1.SSS3">
  <title>Phase III: final r-CMB receptor model</title>
      <p id="d1e3806">In the final phase (P-III) of constructing our r-CMB receptor model, we used
seven factors which were all constrained with the profiles and allowed
variabilities from the previous phase (P-II, AS, LV-OOA, SV-OOA, BBOA, ON,
HOA, AN). The ME-2 algorithm was tasked with resolving the factors' temporal
behaviour.</p>
      <p id="d1e3809">To derive final characteristic spectra for the model components, as well as
to study the variability of spectra in the solutions, we once more applied
the same clustering procedure and silhouette analysis as for previous
phases. The maximal structure (silh 0.85) was achieved for the seven-cluster
solution (<inline-formula><mml:math id="M186" display="inline"><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi mathvariant="normal">m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">1.81</mml:mn></mml:mrow></mml:math></inline-formula>), which was to be expected considering ME-2
was run with seven rather strictly constrained factors in this phase. With
silhouette weighting applied, we obtain the final spectra and variabilities
(Fig. 4). We note that this final clustering and weighting step mainly serves
to provide an estimate of variability within each aerosol type but also
yields final spectra to be used as library references for the outcome of
this work. Details of the solution of the r-CMB model are discussed in
following sections, from the perspective of mass attribution (Sect. 3.2.1)
and spectral characteristics (Sect. 3.2.2). Diurnal cycles of the
components for the entirety of data are available in the Supplement (Fig. S12). Due
to the rural setting of the site and the generally long transport times of
aerosol before reaching the site, diurnal cycles for the various aerosol
types are not as characteristic as they would be for urban measurements (for
example temporal trends of HOA and BBOA). Also due to seasonal differences, the
variability between data sets is considerable, resulting in high uncertainty
in interpretation. The daily cycles are likely a mixed product of source
emissions, boundary layer dynamics and aerosol temperature response. While
of interest, disentangling these processes is beyond the topic of this
study.</p>
</sec>
</sec>
<sec id="Ch1.S3.SS2">
  <title>Overview of r-CMB model results</title>
<sec id="Ch1.S3.SS2.SSS1">
  <title>Mass attribution and “default” AMS chemical speciation for r-CMB
components</title>
      <p id="d1e3839">Tabulation of final explained variations (EVs; Paatero, 2000; Canonaco et
al., 2013) for the r-CMB model is shown in Table 3. The seven-component
r-CMB model explains <inline-formula><mml:math id="M187" display="inline"><mml:mrow><mml:mn mathvariant="normal">83</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula> % of the variation in loadings, when
variation from low-SNR variables is included, and <inline-formula><mml:math id="M188" display="inline"><mml:mrow><mml:mn mathvariant="normal">97</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:math></inline-formula> % when
only residuals of variables with SNR <inline-formula><mml:math id="M189" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula> are considered. The
components with lowest loadings (ON, HOA, AN) explain around 4 % to 5 % of
variation, which seems to roughly match the general rule of thumb of PMF–ME-2 being able to extract components of around 5 % of contribution
(Ulbrich et al., 2009).</p>

<?xmltex \floatpos{p}?><table-wrap id="Ch1.T3" specific-use="star"><label>Table 3</label><caption><p id="d1e3879">Explained variations (EV, in percent) for the r-CMB model.</p></caption>
  <?xmltex \igopts{width=441.017717pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-t03.png"/>
</table-wrap>

      <?xmltex \floatpos{p}?><fig id="Ch1.F5" specific-use="star"><label>Figure 5</label><caption><p id="d1e3889">“Default” chemical speciation for r-CMB components: mass
loadings <bold>(a)</bold> and relative contributions <bold>(b)</bold> of default
species in components. Apportionment of default species to r-CMB components
by mass <bold>(c)</bold> and relative contribution <bold>(d)</bold>.</p></caption>
            <?xmltex \igopts{width=469.470472pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f05.png"/>

          </fig>

      <p id="d1e3911">Model results for campaign VIII, especially regarding BBOA, are very
different from other data sets, including the other cold season results
available in data set III, for example (Fig. S5). Upon closer examination, we
attribute the VIII anomaly at least partly to pronounced surface ionisation
effects, discussed more in Sect. 3.4. While we consider the r-CMB results
for campaign VIII too unreliable for use in models or further studies, we
decided not to omit data set VIII, since other AMS data are likely also
affected by the same processes, albeit to a lesser degree. The attribution
of anomalies to exact processes is very difficult, and surface ionisation
effects remain hard to quantify. We hope that reporting our results in full
also furthers the discussion of surface ionisation in the AMS, and
potentially helps other AMS users observing similar observations.</p>
      <p id="d1e3914">The composition of our r-CMB components is shown in Fig. 5b, and the same in
absolute mass units in panel (a). The opposite visualisation,
i.e. attribution of default species into r-CMB components, is similarly given
for absolute mass concentration and relative units in Fig. 5c and d. Unlike
mass spectral variables and estimated EV, where signals at <inline-formula><mml:math id="M190" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> are in units
“nitrate equivalent mass” (RIE not applied), all mass concentrations
reported are corrected for relative ionisation efficiency (see Supplement,
Sect. S4).</p>
      <p id="d1e3929">Generally, the separation between the inorganic r-CMB components (AS, AN)
and organics (LV-OOA, SV-OOA, BBOA, HOA) seems clear (Fig. 5). Ammonium
nitrate and sulfate components consist primarily of inorganic ion species
(81 % to 84 %), while for organic components the inorganic ion species
contribution is small (LV-OOA: 8 %, SV-OOA: 8 %, BBOA: 6 %, HOA:
3 %). However, extensive oxidation of organics in aerosol typically
results in the formation of organic acids (Yatavelli et al., 2015; Vogel et al.,
2013; Duplissy et al., 2011), and we hypothesise that organic salt formation with
[<inline-formula><mml:math id="M191" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>] could account for the notable 5 % mass contribution of
ammonium to this aerosol type.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F6" specific-use="star"><label>Figure 6</label><caption><p id="d1e3947">Mass attribution in the default AMS speciation scheme <bold>(a)</bold>
and by r-CMB components <bold>(b)</bold> for all eight data sets combined. Values
are (data set length-weighted) averages for all data combined. Absolute mass
concentrations are in units (<inline-formula><mml:math id="M192" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>g m<inline-formula><mml:math id="M193" display="inline"><mml:msup><mml:mi/><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula>).</p></caption>
            <?xmltex \igopts{width=341.433071pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f06.png"/>

          </fig>

      <?pagebreak page3658?><p id="d1e3982">Explanations for the observed mixing of ion species can include (1) mixed
emission profiles at sources, variabilities within a source type, as well as
collocation of sources; (2) atmospheric processes, such as mass transfer
between the species by evaporation, condensation (e.g. Ye et al., 2016) or
coagulation; and (3) PMF or r-CMB modelling uncertainties. We will discuss the
relative ratios and neutralisation balances of inorganic ion species in
Sect. 3.3.2, in relation to inorganic salt formation scheme. The interesting
exception to the rather clear-cut ion species separation is the ON component,
which contains 40 % of <inline-formula><mml:math id="M194" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> species ions, and 41 % of
ions defined as organic. The possible interpretations
for this distribution are further discussed in Sect. 3.3.2</p>
      <p id="d1e3997">As for the organics–inorganics division, the two speciations (default vs.
r-CMB) give similar results (Fig. 6). For all the data sets combined, the
default organic ion species (“org”) explains an average 57 % of total
aerosol mass at the site. Similarly, combining the mass of all
organic-dominated components (LV-OOA, SV-OOA, BBOA, HOA and ON) results in
60 % mass fraction versus 40 % explained by ammonium nitrate
(5 %) and ammonium sulfate (35 %) salts. The per-data-set mass
apportionment is presented in the Supplement (Fig. S9).</p>
</sec>
<sec id="Ch1.S3.SS2.SSS2">
  <title>Spectral characteristics of organic components</title>
      <p id="d1e4006">As discussed above, despite the mixing observed, the inorganic aerosol
classes generally seem separate from organic aerosols. The scaled
correlation values between inorganic and organic spectra are extremely low
(Supplement Sect. S8, Tables S1 and S2), indicating near-zero similarity and
clear-cut separation between the inorganic and organic aerosol types by the
clustering algorithm. For inter-correlations between the organics-dominated
aerosol classes, the picture is somewhat more complex.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F7" specific-use="star"><label>Figure 7</label><caption><p id="d1e4011"><bold>(a)</bold> P-III (r-CMB) solution – cluster projections onto a
<inline-formula><mml:math id="M195" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">55</mml:mn></mml:msub><mml:mo>/</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (Mohr et al., 2012), O : C (estimated, Aiken et al., 2008)
plane. Circles correspond to the members of the cluster and the cross markers
to cluster centroids. The text markers indicate respective positions of
anthropogenic organic aerosol types from Äijälä et al. (2017).
Marker size indicates organic mass fraction in spectra. Axes are truncated.
<bold>(b)</bold> P-III solution, projected onto the <inline-formula><mml:math id="M196" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">44</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M197" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">43</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> plane
(i.e. the “Sally's triangle” plot; Ng et al., 2011). Circles correspond to
objects in clusters and the cross markers to cluster centroids. Marker size
indicates organic mass fraction in spectra. A dotted line marks the area
where most laboratory data for organic aerosol falls (Ng et al., 2010).</p></caption>
            <?xmltex \igopts{width=369.885827pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f07.png"/>

          </fig>

      <p id="d1e4065">To understand the drivers for the separation of the organic aerosol types, we
visualised the phase I (unconstrained PMF) and phase III (r-CMB)
classification results with a projection of the clustering solutions onto a
plane defined by an axis corresponding to estimated oxidation level and
another connected to source type (P-III in Fig. 7; P-I available in the
Supplement, Fig. S6). Similar to Äijälä et al. (2017), we
describe the oxidation level of the organic fraction of each component using
the oxygen-to-carbon ratio (O : C) parameterisation of Aiken et al. (2008),
and use the ratio of <inline-formula><mml:math id="M198" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M199" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> to imply source type. The O : C
generally separates LV-OOA and SV-OOA species from each other and from the
fresher aerosol classes. The <inline-formula><mml:math id="M200" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">55</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M201" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> ratio is typically used
for differentiation between HOA and COA or BBOA (Mohr et al., 2012) but
equally seems to set apart the biogenic SOA types from the anthropogenic
aerosols (Äijälä et al., 2017). This is due to the low signal of
<inline-formula><mml:math id="M202" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula>  57 Th, a typical anthropogenic spectral marker, originating from
<inline-formula><mml:math id="M203" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">9</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M204" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">5</mml:mn></mml:msub><mml:msup><mml:mi mathvariant="normal">O</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula> compounds (Mohr et al.,
2012; Zhang et al., 2005).</p>
      <p id="d1e4164">The LV-OOA aerosol type, characterised by the dominant <inline-formula><mml:math id="M205" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 44 and 28 Th
signals, is usually considered a highly oxidised aerosol type that results
from the oxidation of SV-OOA and various fresh emissions (among others
Canonaco et al., 2015). The <inline-formula><mml:math id="M206" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">55</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M207" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> ratio of LV-OOA is
considerably lower than for SV-OOA in both solutions, indicating the
inclusion of other sources beyond the <inline-formula><mml:math id="M208" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>-poor biogenic SOA
contribution. SV-OOA, on the other hand, has the highest
<inline-formula><mml:math id="M209" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">55</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M210" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> ratio of the classes, hinting at the predominantly
biogenic origin of the SV-OOA at the site. The difference is further
amplified for phase II and III solutions compared to the unconstrained PMF.
We hypothesise that this change can result from improved differentiation
between SV-OOA and the BBOA species (in P-II), as these aerosol types may be
difficult to separate initially due to similar oxidation level and features
of the spectra (<inline-formula><mml:math id="M211" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.34</mml:mn></mml:mrow></mml:math></inline-formula>; Table S3). The SV-OOA is
characterised by the non-oxygen-containing ions at <inline-formula><mml:math id="M212" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 29, 43 and 55 Th
(Mohr et al., 2009), as well as mass-to-charge <inline-formula><mml:math id="M213" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 53 Th signal
(<inline-formula><mml:math id="M214" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">5</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) typical of boreal forest biogenic backgrounds (e.g.
Corrigan et al., 2013). The <inline-formula><mml:math id="M215" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup><mml:mo>/</mml:mo><mml:msup><mml:mi mathvariant="normal">NO</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula> ratio of 0.10 for
nitrate-containing SV-OOA reported by Hao et al. (2014) matches our
observations for the nitrates in SV-OOA (<inline-formula><mml:math id="M216" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup><mml:mo>/</mml:mo><mml:msup><mml:mi mathvariant="normal">NO</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula> of <inline-formula><mml:math id="M217" display="inline"><mml:mrow><mml:mn mathvariant="normal">0.11</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.15</mml:mn></mml:mrow></mml:math></inline-formula>; Eqs. 7 and S5). This may indicate the presence of organonitrate
species in the SV-OOA factor.</p>
      <p id="d1e4348">We also projected the P-I and P-III solutions to the (<inline-formula><mml:math id="M218" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">44</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M219" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">43</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>)
plane (P-III in Fig. 7; P-I in the Supplement, Fig. S6), to produce a result
comparable to the triangle plot by Ng et al. (2010). The result indicates a
clear separation between the low and semi-volatile aerosol types, as well as
the primary combustion aerosols (HOA, BBOA), and the spectral shifts<?pagebreak page3659?> from
phase 1 “bulk PMF” results to those of the final r-CMB model.</p>
      <p id="d1e4373">As stated in Sect. 3.1, the spectra of BBOA and HOA aerosol types match
the previously published observations. The HOA spectrum is characterised by
the ion series <inline-formula><mml:math id="M220" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M221" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 29, 43, 57, 71, 85, 99 Th etc.) and
<inline-formula><mml:math id="M222" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> (<inline-formula><mml:math id="M223" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 41, 55, 69, 83, 97 Th etc.) resulting from alkanes and
aromatics from traffic emissions (diesel exhaust, lubricating oil; Chirico
et al., 2010; Mohr et al., 2009; Canagaratna et al., 2004). The biomass
burning organic aerosol levoglucosan marker signals at <inline-formula><mml:math id="M224" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 60
(<inline-formula><mml:math id="M225" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">O</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) and 73 Th (<inline-formula><mml:math id="M226" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">5</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">O</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>)
(Cubison et al., 2011; Schneider et al., 2006; Elsasser et al., 2012) are
clearly identifiable in the BBOA spectra (Figs. 3, 4) and set this class apart from HOA and
SV-OOA with some similar features. The contribution of often biogenic signals
at <inline-formula><mml:math id="M227" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 53 Th is also lower for BBOA than for the biogenic, semi-volatile SOA.
The pronounced signal from aromatic rings (tropyllium cation
<inline-formula><mml:math id="M228" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">7</mml:mn></mml:msub><mml:msubsup><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">7</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>) at <inline-formula><mml:math id="M229" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 91 Th is a typical result of fragmentation of
aromatic hydrocarbon compounds (Lindon et al., 2016). As stated previously,
we presume the BBOA class also encompasses any COA contributions, which are
likely unresolvable as a separate class due to high spectral similarity
(0.79; Sect. 3.1.1).</p>
      <p id="d1e4547">In terms of spectral characteristics, the organic contributions of AS and AN
classes fall somewhere between the distinct organic classes and offer little
in terms of significant organic markers. Notably, the organics in the ON
class exhibit some of the characteristics of LV-OOA and feature generally
high <inline-formula><mml:math id="M230" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">44</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. This may indicate a high degree of oxidation of the organics
for this aerosol type (Aiken et al., 2008). However, alternative plausible
interpretations exist: AMS response from oxidation products of amine
compounds and amine-nitrate salts feature similarly high <inline-formula><mml:math id="M231" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">44</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (Murphy et
al., 2007) as does a typical amine fragment ion <inline-formula><mml:math id="M232" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">6</mml:mn></mml:msub><mml:msup><mml:mi mathvariant="normal">N</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>
(McLafferty and Turecek, 1993). Furthermore, as discussed in Sect. 3.3.2, an
equally plausible explanation would be inorganic nitrate salts such as
<inline-formula><mml:math id="M233" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">KNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> (from biomass burning for example; Li et al., 2003)
contributing to this class in the form of the Pieber et al. (2016) thermal
decomposition artefact. The contribution of <inline-formula><mml:math id="M234" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 55 and 57 Th signals to the
ON species are both low and the ratio 1.37 of <inline-formula><mml:math id="M235" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">55</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M236" display="inline"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mn mathvariant="normal">57</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> is much
lower than for the biogenic aerosol species. Without more detailed analysis,
and due to the uncertainties surrounding the origins of this aerosol type
(Sect. 3.3.2), it is difficult to say with any certainty if this is due to
anthropogenic nature of this aerosol, or for example due to fragmentation
pattern of characteristic organic compounds in this aerosol type.</p>
</sec>
</sec>
<sec id="Ch1.S3.SS3">
  <title>Comparisons with reference methods</title>
<sec id="Ch1.S3.SS3.SSS1">
  <title>Comparison with “traditional” ME-2 analysis for aerosol organic
component</title>
      <p id="d1e4652">In order to evaluate the performance of the source apportionment approach
presented in this study for organic aerosol, we compare our results to
results only relying on the organic mass spectral fingerprints. Specifically,
two data sets covered in this study (data sets II and III; Table 1) were also
included in the Crippa et al. (2014) analysis, which allows us to compare
factorisation results directly. We chose to compare the Crippa et al. (2014)
results to ours from data set II. We note that while there are minor
differences in the<?pagebreak page3660?> pre-processing and corrections for data covered in Crippa
et al. (2014), the factorisation input is very similar in both cases. The
ME-2 model used by Crippa and co-workers included only the organic spectra
and apportioned its mass to four factors: LV-OOA, SV-OOA, BBOA and HOA. The
latter two components were constrained using a HOA profile from an urban
aerosol study in Paris (Crippa et al., 2013) and an average BBOA of those
extracted for Mexico City, Mexico, and Houston, USA (Ng et al., 2011). The
allowed variability around these anchors for all variables (<inline-formula><mml:math id="M237" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula>) was
5 % (HOA) and 30 % (BBOA).</p>
      <p id="d1e4667">We compared the solutions for Crippa et al. (2014) factorisation to our r-CMB
model solution data set II, both for loadings (Fig. 8) and profiles (Fig. 9).
Generally the solutions correlated highly – the loadings (<inline-formula><mml:math id="M238" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>) and
profiles (<inline-formula><mml:math id="M239" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>) for LV-OOA (<inline-formula><mml:math id="M240" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>: <inline-formula><mml:math id="M241" display="inline"><mml:mrow><mml:msup><mml:mi>r</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.92</mml:mn></mml:mrow></mml:math></inline-formula>; <inline-formula><mml:math id="M242" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>:
<inline-formula><mml:math id="M243" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.96</mml:mn></mml:mrow></mml:math></inline-formula>) and SV-OOA (<inline-formula><mml:math id="M244" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>: 0.94; <inline-formula><mml:math id="M245" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>: 0.99)
agreed the closest, whilst the HOA also had high similarities (<inline-formula><mml:math id="M246" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>:
0.85; <inline-formula><mml:math id="M247" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>: 88). The BBOA factor or component correlated markedly
less (<inline-formula><mml:math id="M248" display="inline"><mml:mi mathvariant="bold">F</mml:mi></mml:math></inline-formula>: 0.63; <inline-formula><mml:math id="M249" display="inline"><mml:mi mathvariant="bold">G</mml:mi></mml:math></inline-formula>: 0.42), which we hypothesise to be due
to differences in the anchors used, COA likely attributed to this class, high
spectral similarity between SV-OOA and BBOA, and the generally low loadings
of BBOA observed at SMEAR II.</p>

      <?xmltex \floatpos{p}?><fig id="Ch1.F8" specific-use="star"><label>Figure 8</label><caption><p id="d1e4776">Time series comparison of aerosol organic component with Crippa et
al. (2014) for the September 2008 campaign (data set II). For comparability,
only the organic part of r-CMB model components are considered. Data from
this work have been averaged to 1 h resolution. Organics in other r-CMB
components (AS, AN, ON) are taken into account for the total amount but not
shown separately. Discrepancy in total organics loading is due to differences
in pre-processing values (e.g. ionisation efficiency, collection
efficiency).</p></caption>
            <?xmltex \igopts{width=369.885827pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f08.png"/>

          </fig>

      <?xmltex \floatpos{t}?><fig id="Ch1.F9" specific-use="star"><label>Figure 9</label><caption><p id="d1e4788">Comparison of organic part of spectra with Crippa et al. (2014) for
data set II. The r-CMB model results from this study are shown in colour, and
the Crippa et al. (2014) spectra in black. For comparability, the Crippa et
al. (2014) spectra were corrected for a difference in fragmentation tables
used (included <inline-formula><mml:math id="M250" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 28 Th, updated to modern calculation of <inline-formula><mml:math id="M251" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 16, 17 and
18 Th organic signals) and total signal subsequently re-normalised to unity.
Spectra similarity is evaluated using Pearson's squared correlation
coefficients: unscaled (<inline-formula><mml:math id="M252" display="inline"><mml:mrow><mml:msup><mml:mi>r</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>) and with mass scaling (<inline-formula><mml:math id="M253" display="inline"><mml:mrow><mml:msubsup><mml:mi>r</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula>).</p></caption>
            <?xmltex \igopts{width=369.885827pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f09.png"/>

          </fig>

      <p id="d1e4845">The discrepancy in distribution of absolute mass for the LV-OOA and SV-OOA
components, indicated by the sub-unity slope, suggests the r-CMB model
attributes a part of the organic mass from the SOA factors into BBOA, AS, AN
and ON components, while HOA is represented rather identically in both
models. A difference in mass distribution between the results is to be
expected, considering the r-CMB model allows for organics in seven
components, while the model of Crippa et al. (2014) model only comprises four
components. Generally, we take the similar results of the methods, as shown
by the high correlation values, to indicate that inclusion of inorganics in
the model does not significantly perturb modelling of the organics. We also
note the r-CMB components included (HOA BBOA, LV-OOA, SV-OOA) are
predominantly composed of organics (92 % to 97 %; Fig. 5), and the
four components presented comprise 82 % of total organics.</p>
</sec>
<sec id="Ch1.S3.SS3.SSS2">
  <title>Comparison of inorganic salt and organic nitrogen results with
reference methods</title>
      <p id="d1e4854">To evaluate the inorganic mass apportionment result, we compared the
loadings from the r-CMB solution against the result from the inorganics
apportionment scheme (Sect. 2.4.1). The comparison, again performed for
data set II, is presented in Fig. 10. We additionally compared the r-CMB
ON component loadings with <inline-formula><mml:math id="M254" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> mass estimate from the
Kiendler-Scharr parameterisation (Eq. 7; Sect. 2.4.2).</p>

      <?xmltex \floatpos{p}?><fig id="Ch1.F10" specific-use="star"><label>Figure 10</label><caption><p id="d1e4870">Comparison of Inorganics apportionment methods (r-CMB and ion
balance scheme. The estimates from the ion balance scheme (Sect. 2.4.1) are
shown in black, and the r-CMB model results in colour. The linear fits (right
panels) represent the data poorly due to high amount of zero-value points and
outliers.</p></caption>
            <?xmltex \igopts{width=426.791339pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f10.png"/>

          </fig>

      <p id="d1e4879">The loadings for the (r-CMB) AS component compare well with the combined
<inline-formula><mml:math id="M255" display="inline"><mml:mrow><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">HSO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow><mml:mo>+</mml:mo><mml:mrow class="chem"><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow><mml:mo>+</mml:mo><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:mrow></mml:math></inline-formula>
loading, indicating ammonium(bi)sulfate is described similarly by both models
(<inline-formula><mml:math id="M256" display="inline"><mml:mrow><mml:msup><mml:mi>r</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.92</mml:mn></mml:mrow></mml:math></inline-formula>). We assume the r-CMB AS component to be comprised of both
<inline-formula><mml:math id="M257" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">HSO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M258" display="inline"><mml:mrow class="chem"><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, which would very likely
be classified together due to their high spectral
similarity. For ammonium nitrate the correlation between loadings is very low
(<inline-formula><mml:math id="M259" display="inline"><mml:mrow><mml:msup><mml:mi>r</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.16</mml:mn></mml:mrow></mml:math></inline-formula>). Looking at the time series, the reason seems to be that the
speciation scheme-based model often predicts a total absence of AN, due to a
high amount of sulfate in aerosol. While the r-CMB model also generally
estimates loadings to be low, they are clearly non-zero in the r-CMB model.
We take the result to reflect the assumption of complete and instantaneous
internal and external mixing of aerosol in the speciation scheme
(Sect. 2.4.1).</p>
      <p id="d1e5001">The loading prediction for organic nitrogen by the speciation scheme model
is similarly event-driven and the model results do not correlate. This is
caused by the nitrate assignment to organonitrate class when not explained
by <inline-formula><mml:math id="M260" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>. Same can be said for the excess <inline-formula><mml:math id="M261" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> class, which
corresponds to the <inline-formula><mml:math id="M262" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> species in the other, mostly organic r-CMB
factors, principally the LV-OOA; the ion balance scheme predicts zero
concentration for many of the data points, an estimate not matching with the
r-CMB-based result.</p>
      <p id="d1e5043">On these differences between the models, we note that the ion-balance-based
apportionment scheme is sensitive to small changes in <inline-formula><mml:math id="M263" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>
concentrations, especially for data with generally low <inline-formula><mml:math id="M264" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>
concentrations, such as ours. A simple sensitivity estimate, available in the
Supplement (Sect. S4), was performed for data set III. The result indicates
that a 33 % change in RIE<inline-formula><mml:math id="M265" display="inline"><mml:msub><mml:mi/><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:msub></mml:math></inline-formula> changes the component mass
concentrations on average 5 % for AS, 56 % for AN, 66 % for
orgNO3 and 164 % for excess_NH4 components. On the other hand, the r-CMB
model is rather insensitive to error in RIE estimates, since (1) the spectra
in factorisation and clustering have the variables' signals in
“<inline-formula><mml:math id="M266" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> equivalent mass concentration” units, which is not (yet)
corrected for RIE of different species; (2) mass scaling causes low mass
signals such as <inline-formula><mml:math id="M267" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> fragments (<inline-formula><mml:math id="M268" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 15 to 17 Th) to weight less
(relative to higher <inline-formula><mml:math id="M269" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> variables) for determining the solution; and
(3) <inline-formula><mml:math id="M270" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> seems not to be an unique marker of any of the classes. We
therefore suggest a factorisation-based model such as the r-CMB model
presented here is much more robust for resolving speciation of inorganic
aerosol components. The sensitivity test (Supplement, Sect. S4) also
indicates that the temporal differences between the ion balance scheme and
r-CMB are not explained by a difference in RIE<inline-formula><mml:math id="M271" display="inline"><mml:msub><mml:mi/><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:msub></mml:math></inline-formula>. Thus, the
reasons for the discrepancies are more likely related to the unrealistic
assumptions of the inorganics apportionment model.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F11" specific-use="star"><label>Figure 11</label><caption><p id="d1e5154">Comparison of Kiendler-Scharr parameterisation (Kiendler-Scharr et
al., 2016; black line; moving median filter for 11 points window applied;
<inline-formula><mml:math id="M272" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">calib</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.42</mml:mn></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M273" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.1</mml:mn></mml:mrow></mml:math></inline-formula>) for organonitrate with
<inline-formula><mml:math id="M274" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> ion species in ON factor from our r-CMB model (in colour).</p></caption>
            <?xmltex \igopts{width=426.791339pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f11.png"/>

          </fig>

      <?pagebreak page3662?><p id="d1e5208">In addition to deriving organic nitrogen mass from the ion balance scheme,
we compared the r-CMB-derived ON loading with the Kiendler-Scharr method for
estimating the orgNO3 mass loading (Eq. 6). The comparison, shown in
Fig. 11, indicates that the two methods produce a very similar result for
organic nitrogen mass (<inline-formula><mml:math id="M275" display="inline"><mml:mrow><mml:msup><mml:mi>r</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.94</mml:mn></mml:mrow></mml:math></inline-formula>). The discrepancy in absolute mass
is likely explained by the difference in the ratio values (<inline-formula><mml:math id="M276" display="inline"><mml:mi>R</mml:mi></mml:math></inline-formula>) used for
Eq. (6) parameterisation, and those featured in the r-CMB AN and ON
components (<inline-formula><mml:math id="M277" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">AN</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.44</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.11</mml:mn></mml:mrow></mml:math></inline-formula>; <inline-formula><mml:math id="M278" display="inline"><mml:mrow><mml:msub><mml:mi>R</mml:mi><mml:mi mathvariant="normal">ON</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.08</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">0.07</mml:mn></mml:mrow></mml:math></inline-formula>;
P-III, Eq. S5).</p>
      <p id="d1e5271">The similarity to Kiendler-Scharr parameterisation result does seem to
support the interpretation of a nitrogen component in ON as organonitrate
(<inline-formula><mml:math id="M279" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">orgNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>). Some similarities in temporal behaviour between the ON component
and (non-quantitative) <inline-formula><mml:math id="M280" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">K</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula> ions were observed, potentially suggesting
thermal ionisation of Potassium salts (e.g. <inline-formula><mml:math id="M281" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">KNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula>) might contribute an
unknown fraction to ON (Supplement, Sect. S11). Also, 63 % of chloride ions
species associate with the ON component. The reason is unclear, and although
chloride signals were very low in general, we cannot rule out that some of
the ON component could still be explained by other chemical compositions
than organonitrate.</p>
      <?pagebreak page3664?><p id="d1e5307">The <inline-formula><mml:math id="M282" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : org ratio of our ON factor is close to unity (Fig. 5),
while for example Farmer et al. (2010) report a nitrogen-to-carbon ratio of 0.04,
and oxygen-to-carbon of 0.25 for AMS spectra of organonitrate standards.
However, several factors are likely to affect the <inline-formula><mml:math id="M283" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> : org ratio
observable in atmospheric ON factorisations. Firstly, two different pathways
for organonitrates exist: (i) the primarily daytime reactions of organic
peroxy radicals with NO (Orlando and Tyndall, 2012), and (ii) the
<inline-formula><mml:math id="M284" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>-radical-initiated oxidation of unsaturated compounds during
night-time (Peräkylä et al., 2014). While the nitrate functionality
in all these reactions is identical, the organic part can be vastly
different, as peroxy radicals are formed in almost all atmospheric oxidation
reactions, irrespective of oxidant (e.g. OH or ozone) or VOC (biogenic or
anthropogenic). Therefore, it is not to be expected that a specific organic
spectrum should be linked to the organic nitrate functionality. Secondly, as
described by Lee et al. (2016) for example, the particle-phase lifetime of
organonitrates is of the order of hours with respect to hydrolysis. This
reaction will convert the nitrate functionality to nitric acid, while the
organic part remains intact, except for the conversion of the -<inline-formula><mml:math id="M285" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">ONO</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>
group to -OH. This conversion will only have a small impact on the
volatility of the organic molecule (e.g. Kroll and Seinfeld, 2008), while
the nitric acid may well evaporate in the fairly low-ammonia boreal forest
environment. Taken together, the diverse formation pathways as well as the
atmospheric processing are likely to cause ON spectra retrieved from ambient
air factorisations to look different from, for example, freshly formed organic
aerosol from organonitrate standards, such as those used by Farmer et al. (2010). We therefore avoid putting too much emphasis on the organic parts
observed in our ON factor.</p>
</sec>
</sec>
<sec id="Ch1.S3.SS4">
  <title>Outlier observations</title>
      <p id="d1e5361">During the course of our analysis we encountered some anomalous observations
likely stemming from surface ionisation effects, i.e. molecules being
thermally ionised at the heater surface rather than at the ionisation region
by electron impact. A thorough review and discussion of AMS-related surface
ionisation effects was recently published by Drewnick et al. (2015). Drewnick
et al. (2015) emphasise that the division between refractory and
non-refractory aerosol is not binary, and there exist a number of
semi-refractory compounds that the AMS can measure, albeit
non-quantitatively.</p>

      <?xmltex \floatpos{t}?><fig id="Ch1.F12" specific-use="star"><label>Figure 12</label><caption><p id="d1e5366">Spectra of outlier clusters (no. 9 to no. 17) for P-I. The spectra
for these outlier classes were omitted from our analysis due to not meeting
the criteria of (1) occurrence and/or (2) interpretability (on an acceptable
level). Despite their mostly speculative value, many of them feature some
chemically interesting characteristics, potentially pointing to the presence of
amines (signals at <inline-formula><mml:math id="M286" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 58, 86 and 100 Th; clusters no. 9, no. 11 and
no. 17), alkali metals (<inline-formula><mml:math id="M287" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">85</mml:mn></mml:msup><mml:mi mathvariant="normal">Rb</mml:mi></mml:mrow></mml:math></inline-formula>, <inline-formula><mml:math id="M288" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">87</mml:mn></mml:msup><mml:mi mathvariant="normal">Rb</mml:mi></mml:mrow></mml:math></inline-formula>; no. 10), cycloalkanes
(signals at series <inline-formula><mml:math id="M289" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 69, 79, 81, 95, 107 and 109 Th; no. 16) and organic
sulfate (signal at <inline-formula><mml:math id="M290" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 80, 81 Th; no. 13, no. 17), as well as effects of
surface ionisation (<inline-formula><mml:math id="M291" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">41</mml:mn></mml:msup><mml:msup><mml:mi mathvariant="normal">K</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>; <inline-formula><mml:math id="M292" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">39</mml:mn></mml:msup><mml:msup><mml:mi mathvariant="normal">K</mml:mi><mml:mrow><mml:mo>+</mml:mo><mml:mo>+</mml:mo><mml:mo>+</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>; no. 10, no. 17)
and a likely artefact from poor air-beam correction (signal at <inline-formula><mml:math id="M293" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 29 Th;
no. 12).</p></caption>
          <?xmltex \igopts{width=483.69685pt}?><graphic xlink:href="https://acp.copernicus.org/articles/19/3645/2019/acp-19-3645-2019-f12.png"/>

        </fig>

      <p id="d1e5483">Our observations on extracted “outlier” PMF factors from the different
phases of analysis match well with the finding and calculations of Drewnick
et al. (2015), as well as other similar AMS observations published. In Fig. 12, we present the outlier clusters from phase I classification solution
that were excluded from further analysis due to a low number of occurrences
or/and questionable interpretability. The emergence of most of these spectra
are likely attributable to over-resolution or questionable separation of
the main PMF factors, due to setting the number of PMF factors to 10. Despite
their questionable value for the main analysis, we find they contain many
potentially interesting mass spectral features and seem not to emerge by
chance. Below we will present some hypotheses on their possible
interpretation.</p>
<sec id="Ch1.S3.SS4.SSS1">
  <title>Surface ionisation and data correction artefacts</title>
      <p id="d1e5491">Drewnick et al. (2015) note that the main semi-refractory elements eligible
for ionisation in the AMS are Cd (<inline-formula><mml:math id="M294" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 112 Th), Cs (132 Th), Hg (200 Th), K
(39 Th), Na (23 Th), Rb (85 Th) and Se (79 Th). The proneness of potassium
(K) and sodium (Na) for non-quantitative thermal ionisation effects in the
AMS is well known (e.g. Allan et al., 2003a), which is also why they are
excluded from AMS (quantitative) data analysis. Although the main potassium
isotope is omitted, the <inline-formula><mml:math id="M295" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">41</mml:mn></mml:msup><mml:mi mathvariant="normal">K</mml:mi></mml:mrow></mml:math></inline-formula> isotope (with 6.7 % relative
abundance; Haynes, 2014) is not, and a correction is applied
in fragmentation table instead. The K-derived signals were especially
prominent in data set VIII (see Supplement Fig. S7), with contributions of 1
to 2 order of magnitudes higher than the highest well-behaving signals such
as <inline-formula><mml:math id="M296" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 44 Th or 48 Th. We hypothesise the strong signals at <inline-formula><mml:math id="M297" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 41 Th
observable in many of the outlier spectra (clusters no. 10, no. 15 and
no. 17) may be due to insufficient accuracy of the <inline-formula><mml:math id="M298" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">41</mml:mn></mml:msup><mml:mi mathvariant="normal">K</mml:mi></mml:mrow></mml:math></inline-formula> isotope
correction.</p>
      <p id="d1e5554">A similar data processing/correction artefact is likely seen in cluster
no. 12 with a lone, dominant signal at <inline-formula><mml:math id="M299" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 29 Th. This mass-to-charge ratio is a
problematic one for lower-resolution AMS data due to the contribution of
a <inline-formula><mml:math id="M300" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">29</mml:mn></mml:msup><mml:msub><mml:mi mathvariant="normal">N</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> isotopic peak, and location on the slope of the
enormous <inline-formula><mml:math id="M301" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">N</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> peak at <inline-formula><mml:math id="M302" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 28 Th. Although the signal at <inline-formula><mml:math id="M303" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 29 Th is corrected
for the (measured) isotope contribution, even a slight mismatch in the
correction results in notable error in the estimation of the organic signal
fraction at <inline-formula><mml:math id="M304" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 29 Th. We attribute this problem specifically to the scarce
availability of filters for the earliest sets of data.</p><?xmltex \hack{\newpage}?>
</sec>
<?pagebreak page3665?><sec id="Ch1.S3.SS4.SSS2">
  <title>Alkali metals</title>
      <p id="d1e5640">The prominent signals at <inline-formula><mml:math id="M305" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 85 and 87 Th for cluster no. 10 correspond to
rubidium alkali metal ions, and their respective ratios (<inline-formula><mml:math id="M306" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 85 Th
signal : <inline-formula><mml:math id="M307" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 87 Th signal <inline-formula><mml:math id="M308" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 73.2 : 26.8) to what we would expect
based on isotopic distribution of Rb observed in nature
(<inline-formula><mml:math id="M309" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">85</mml:mn></mml:msup><mml:mi mathvariant="normal">Rb</mml:mi></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M310" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi/><mml:mn mathvariant="normal">87</mml:mn></mml:msup><mml:mi mathvariant="normal">Rb</mml:mi></mml:mrow></mml:math></inline-formula> <inline-formula><mml:math id="M311" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 72.2 % : 27.8 %; Haynes,
2014). Examination of the raw mass spectrum, available in Sect. S12, also
supports rubidium as a likely candidate. Unlike for the potassium signal, the
temporal behaviour of the factors corresponding to cluster no. 10 is highly
plume-like. Preliminary analysis of wind direction shows the plume direction
to correspond to the arrival direction from the district heating plant
(co-located with a sawmill and a pellet factory) at Juupajoki, 5 km due
south-east (Supplement, Sect. S12). Similar observations of rubidium from
coal burning were previously published by Irei et al. (2014). It seems likely
that this aerosol class would originate from the heating plant.</p><?xmltex \hack{\newpage}?>
</sec>
<sec id="Ch1.S3.SS4.SSS3">
  <title>Organic nitrogen and sulfur</title>
      <p id="d1e5725">As for the signals often attributed to amines at 86 and 100 Th, (Mclafferty,
1959), featured in cluster no. 11, in the absence of alternative explanation for
the 100 and 86 signals, we are inclined to believe they actually represent
atmospheric amines. The cluster spectrum corresponds also to the spectra of
pollution plumes, extracted for data sets I to III in our previous study on
pollution events (Äijälä et al., 2017). We note that amines are also
reported to be prone to surface ionisation, and for example trimethylamine is
thermally ionised above temperatures 300 <inline-formula><mml:math id="M312" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C, with high thermal
ionisation efficiency at 600 <inline-formula><mml:math id="M313" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C (50 % of the maximum efficiency
observed at around 350 <inline-formula><mml:math id="M314" display="inline"><mml:msup><mml:mi/><mml:mo>∘</mml:mo></mml:msup></mml:math></inline-formula>C; Rasulev and Zandberg, 1988). It thus
seems plausible that surface ionisation effects could contribute to the amine
observations as well. In our earlier work (Äijälä et al., 2017),
we also attributed a similar spectral signal at <inline-formula><mml:math id="M315" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 58 Th to amines
(<inline-formula><mml:math id="M316" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">8</mml:mn></mml:msub><mml:msup><mml:mi mathvariant="normal">N</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>). However, in light of the recent results of Drewnick
et al. (2015) on surface ionisation of NaCl, and the detachment of
the <inline-formula><mml:math id="M317" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 58 Th signal from the class of other amine-attributed signals at 86 and
100 Th, another plausible explanation for the <inline-formula><mml:math id="M318" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 58 Th<?pagebreak page3666?> signal observed in
clusters no. 9, no. 11, no. 16 and no. 17 exists. Namely, we find it
plausible that such a spectrum would arise from surface ionisation of sodium
chloride and thus represent atmospheric <inline-formula><mml:math id="M319" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">NaCl</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>.</p>
      <p id="d1e5824">Clusters no. 13, no. 15 and no. 16 are interesting from the viewpoint of
organonitrates and sulfates. Nitrate signal in clusters no. 15 and no. 16
is composed mostly of <inline-formula><mml:math id="M320" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 30 Th signal, with negligible <inline-formula><mml:math id="M321" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 46 Th contribution.
With the high organic contribution, this would make these classes potential
candidates for containing organonitrates. However, an equally plausible
explanation is the surface ionisation of <inline-formula><mml:math id="M322" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">KNO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, discussed previously.
The pronounced signals at <inline-formula><mml:math id="M323" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 80 and/or 81 Th featured in clusters no. 13,
no. 14 and no. 17 are likely explained by humidity-induced fragmentation
changes in the ionisation of sulfate species, (particularly <inline-formula><mml:math id="M324" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> and
<inline-formula><mml:math id="M325" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">3</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>; Drewnick et al., 2015). We do note that organosulfur-containing
samples characterised by Farmer at al. (2010) also feature an increased ratio
of <inline-formula><mml:math id="M326" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 80 and 81 Th signals compared to <inline-formula><mml:math id="M327" display="inline"><mml:mrow class="chem"><mml:mo>(</mml:mo><mml:msub><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub><mml:msub><mml:mo>)</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:msub><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula>, so we cannot
rule out organic sulfate contribution.</p>
</sec>
<sec id="Ch1.S3.SS4.SSS4">
  <title>Cycloalkanes</title>
      <p id="d1e5943">Finally, we wish to draw attention to the ion series of cluster no. 16, with
prominent organic signals at 69, 79, 81, 95, 107 and 109 Th, which have been connected to
cycloalkanes (McLafferty and Turecek, 1993; Alfarra et al., 2004).
Cycloalkanes are common in lubricating oils for example (Liang et al., 2018),
which are an important, even dominant, component in traffic emissions (Worton
et al., 2014). The closest literature match on ambient observations we found
was the study of Takami et al. (2007), where they observed similar high
concentrations of mass-to-charge 95, 107 and 109 Th, as well as 58 and 85 Th,
but were unable to attribute the observation to a specific source.</p>
</sec>
</sec>
</sec>
<sec id="Ch1.S4" sec-type="conclusions">
  <title>Conclusions</title>
      <p id="d1e5954">We performed a synthesis analysis on eight AMS data sets from a boreal
forest site and constructed a data-driven chemical mass balance type of
receptor model, with relaxed constraints on the component profiles (r-CMB).
Notably, the data comprised both inorganic and organic aerosol components.
The resulting seven-component model explained <inline-formula><mml:math id="M328" display="inline"><mml:mrow><mml:mn mathvariant="normal">83</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula> % of variability
in data (<inline-formula><mml:math id="M329" display="inline"><mml:mrow><mml:mn mathvariant="normal">96</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">3</mml:mn></mml:mrow></mml:math></inline-formula> % with low-SNR variables excluded). The model
components for the SMEAR II boreal forest site were as follows, in order of average
aerosol mass contribution: ammonium sulfate (<inline-formula><mml:math id="M330" display="inline"><mml:mrow><mml:mn mathvariant="normal">35</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> %; mean mass
fraction <inline-formula><mml:math id="M331" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> standard deviation over data sets), LV-OOA (<inline-formula><mml:math id="M332" display="inline"><mml:mrow><mml:mn mathvariant="normal">27</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">8</mml:mn></mml:mrow></mml:math></inline-formula> %), SV-OOA (<inline-formula><mml:math id="M333" display="inline"><mml:mrow><mml:mn mathvariant="normal">12</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> %), BBOA (<inline-formula><mml:math id="M334" display="inline"><mml:mrow><mml:mn mathvariant="normal">11</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">7</mml:mn></mml:mrow></mml:math></inline-formula> %), organic nitrogen
(<inline-formula><mml:math id="M335" display="inline"><mml:mrow><mml:mn mathvariant="normal">7</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula> %), ammonium nitrate (<inline-formula><mml:math id="M336" display="inline"><mml:mrow><mml:mn mathvariant="normal">5</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">2</mml:mn></mml:mrow></mml:math></inline-formula> %) and HOA (<inline-formula><mml:math id="M337" display="inline"><mml:mrow><mml:mn mathvariant="normal">3</mml:mn><mml:mo>±</mml:mo><mml:mn mathvariant="normal">1</mml:mn></mml:mrow></mml:math></inline-formula> %).</p>
      <p id="d1e6073">Remarkably, organic nitrogen seems to be a larger component than ammonium nitrate
for the site. However, ambiguity remains in the interpretation of the
organic nitrogen class as organonitrate, prompting caution against casual
use of the <inline-formula><mml:math id="M338" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> : <inline-formula><mml:math id="M339" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">NO</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula> fragmentation ratio as a sole organonitrate
proxy. COA was not resolved separately, presumably due to high spectral
similarity with BBOA and low mass contribution to SMEAR II aerosol and is
most likely included to the BBOA component. Other minor aerosol groups that
were not included in the model feature characteristics potentially
indicative of amine-dominated aerosols, coal combustion aerosol with alkali
metals (rubidium, cesium), and hints of cycloalkanes and
organosulfates. We presume many of these observations may arise from
surface ionisation processes, and as such they may not be currently
quantifiable in mass. Their corroboration, quantification and connection to
emission sources or thermal ionisation effects require further study.</p>
      <p id="d1e6100">We suggest inorganics should be routinely included in factorisation of AMS
data due to the high demand of such data in aerosol models. We wish
specifically to point out that adding the inorganic information is easy and
only requires application of the same tried-and-tested data processing and uses
the same error model as for organics. While inclusion of inorganics does
diminish the relative weight organics carry in the analysis and thus may
hinder extraction organic factors comprising very low fraction (<inline-formula><mml:math id="M340" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:math></inline-formula> %) of total mass (Ulbrich et al., 2009), we argue that the added
information value of inorganic speciation makes up for this. Compared to
organics-only analyses, inclusion of inorganic data increases direct
usability of AMS data for physicochemical aerosol models. We also
demonstrate that factorisation-based speciation provides a speciation that is more
realistic, robust, and less assumption-dependant and calibration-sensitive than
simplistic ion balance schemes.</p>
      <p id="d1e6113">The classification methods presented here for evaluating factor analysis
output can also be useful in applications that produce large
quantities of discrete aerosol spectral data, such as deriving factorisation
error estimates via bootstrapping analysis (Osborne et al., 2014; Brown et
al., 2015). With further development, we find it likely that a two-step analysis
(exploratory factorisation <inline-formula><mml:math id="M341" display="inline"><mml:mo>+</mml:mo></mml:math></inline-formula> classification <inline-formula><mml:math id="M342" display="inline"><mml:mo>→</mml:mo></mml:math></inline-formula> r-CMB) would be a
viable option for increasingly unsupervised and less analyst-biased AMS data
analysis.</p>
      <p id="d1e6131">We would also encourage further development of combined statistical methods
for improved mass spectral feature extraction and parameterisation for mass
spectra, as they will enable future machine-learning applications for data
analysis. Drawing from the comprehensive information available on current
size-resolved aerosol mass spectrometric data, it seems likely that advanced
machine-learning methods (such as data reduction combined with predictive
neural networking, e.g. Burns and Whitesides, 1993; Gasteiger and Zupan,
1993) will likely provide new, improved ways to model aerosol
physicochemical properties like hygroscopicity, volatility and optics in the
near future.</p>
</sec>

      
      </body>
    <back><notes notes-type="dataavailability"><title>Data availability</title>

      <p id="d1e6139">The AMS r-CMB data presented in this study are available
online (Äijälä et al., 2019). The r-CMB component profiles will
additionally be made available in the AMS spectral database
(<uri>http://cires1.colorado.edu/jimenez-group/AMSsd/</uri>, last access: 18 March
2019) upon publication.</p>
  </notes><app-group>
        <supplementary-material position="anchor"><p id="d1e6145">The supplement related to this article is available online at: <inline-supplementary-material xlink:href="https://doi.org/10.5194/acp-19-3645-2019-supplement" xlink:title="pdf">https://doi.org/10.5194/acp-19-3645-2019-supplement</inline-supplementary-material>.</p></supplementary-material>
        </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d1e6154">Contributor roles (shown in italics) corresponding to the taxonomy of CASRAI's CRediT
definitions (<uri>https://casrai.org/credit/</uri>, last access: 18 March 2019)
are as follows:
<list list-type="bullet"><list-item>
      <p id="d1e6162"><italic>Conceptualisation</italic>. MÄ and ME formulated the study.</p></list-item><list-item>
      <p id="d1e6168"><italic>Investigation and data curation</italic>. MÄ, HJ and ME collected and curated the
experimental data.</p></list-item><list-item>
      <p id="d1e6174"><italic>Formal analysis, methodology, visualisation</italic>. MÄ, supported by KRD, designed and performed the
statistical analysis and data visualisations.</p></list-item><list-item>
      <p id="d1e6180"><italic>Validation</italic>. MÄ, KRD and LH reviewed the
data quality and reproducibility.</p></list-item><list-item>
      <p id="d1e6186"><italic>Software, methodology</italic>. FC designed and supported the SoFi
analysis software.</p></list-item><list-item>
      <p id="d1e6192"><italic>Writing</italic>. MÄ wrote the original draft, which was reviewed, commented and edited
by all the authors.</p></list-item><list-item>
      <p id="d1e6198"><italic>Funding acquisition, resources, project administration, supervision</italic>. ME, MK, ASHP, and TP  supported and
supervised the research.</p></list-item></list></p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d1e6206">The authors declare that they have no conflict of interest.</p>
  </notes><ack><title>Acknowledgements</title><p id="d1e6212">We wish to thank the technical staff at INAR and SMEAR II (Pasi Aalto, Erkki Siivola, Heikki Laakso, Toivo Pohja, Veijo Hiltunen and Janne Levula) for
valuable support during the years 2008–2010 in acquiring the data sets
analysed here. We thank Douglas Worsnop for pioneering work in
starting the AMS studies at University of Helsinki, and the valuable
insightful discussions on AMS data analysis and interpretation. We also
gratefully acknowledge the friendly support staff at Aerodyne Research
(especially Donna Sueper and Leah Williams) for their help on data
analytical questions.</p><p id="d1e6214">The research was supported by the following programs: the European
Commission FP6 projects EUCAARI (036833-2), FP7 ACTRIS (262254), the Horizon
2020 project ACTRIS-2 (654109), ERC Grant COALA (638703), the Finnish COE
project CRAICC (272041) and the Academy of Finland COE in Atmospheric
Science (2008–2019).<?xmltex \hack{\newline}?><?xmltex \hack{\newline}?>
Edited by: Dominick Spracklen<?xmltex \hack{\newline}?>
Reviewed by: two anonymous referees</p></ack><ref-list>
    <title>References</title>

      <ref id="bib1.bib1"><label>1</label><mixed-citation>Äijälä, M., Heikkinen, L., Fröhlich, R., Canonaco, F.,
Prévôt, A. S. H., Junninen, H., Petäjä, T., Kulmala, M.,
Worsnop, D., and Ehn, M.: Resolving anthropogenic aerosol pollution types –
deconvolution and exploratory classification of pollution events, Atmos.
Chem. Phys., 17, 3165–3197, <ext-link xlink:href="https://doi.org/10.5194/acp-17-3165-2017" ext-link-type="DOI">10.5194/acp-17-3165-2017</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib2"><label>2</label><mixed-citation>Äijälä, M., Daellenbach, K. R., Canonaco, F., Heikkinen, L.,
Junninen, H., Petäjä, T., Kulmala, M., Prévôt, A. S. H., and
Ehn, M.: Aerosol chemical composition results for SMEAR II 2008–2011 from
r-CMB model results, available at:
<uri>https://etsin.avointiede.fi/dataset/urn-nbn-fi-csc-kata20190319160233052956</uri>,
last access: 19 March 2019.</mixed-citation></ref>
      <ref id="bib1.bib3"><label>3</label><mixed-citation>Aiken, A. C., DeCarlo, P. F., and Jimenez, J. L.: Elemental analysis of
organic species with electron ionization high-resolution mass spectrometry,
Anal. Chem., 79, 8350–8358, <ext-link xlink:href="https://doi.org/10.1021/ac071150w" ext-link-type="DOI">10.1021/ac071150w</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib4"><label>4</label><mixed-citation>Aiken, A. C., Decarlo, P. F., Kroll, J. H., Worsnop, D. R., Huffman, J. A.,
Docherty, K. S., Ulbrich, I. M., Mohr, C., Kimmel, J. R., Sueper, D., Sun,
Y., Zhang, Q., Trimborn, A., Northway, M., Ziemann, P. J., Canagaratna, M.
R., Onasch, T. B., Alfarra, M. R., Prevot, A. S., Dommen, J., Duplissy, J.,
Metzger, A., Baltensperger, U., and Jimenez, J. L.: O <inline-formula><mml:math id="M343" display="inline"><mml:mo>/</mml:mo></mml:math></inline-formula> C and OM <inline-formula><mml:math id="M344" display="inline"><mml:mo>/</mml:mo></mml:math></inline-formula> OC
ratios of primary, secondary, and ambient organic aerosols with
high-resolution time-of-flight aerosol mass spectrometry, Environ. Sci.
Technol., 42, 4478–4485, 2008.</mixed-citation></ref>
      <ref id="bib1.bib5"><label>5</label><mixed-citation>Alfarra, M. R., Coe, H., Allan, J. D., Bower, K. N., Boudries, H.,
Canagaratna, M. R., Jimenez, J. L., Jayne, J. T., Garforth, A. A., Li, S. M.,
and Worsnop, D. R.: Characterization of urban and rural organic particulate
in the lower Fraser valley using two aerodyne aerosol mass spectrometers,
Atmos. Environ., 38, 5745–5758, <ext-link xlink:href="https://doi.org/10.1016/j.atmosenv.2004.01.054" ext-link-type="DOI">10.1016/j.atmosenv.2004.01.054</ext-link>, 2004.</mixed-citation></ref>
      <ref id="bib1.bib6"><label>6</label><mixed-citation>
Alfarra, M. R., Prevot, A. S., Szidat, S., Sandradewi, J., Weimer, S., Lanz,
V. A., Schreiber, D., Mohr, M., and Baltensperger, U.: Identification of the
mass spectral signature of organic aerosols from wood burning emissions,
Environ. Sci. Technol., 41, 5770–5777, 2007.</mixed-citation></ref>
      <ref id="bib1.bib7"><label>7</label><mixed-citation>Allan, J. D., Alfarra, M. R., Bower, K. N., Williams, P. I., Gallagher, M.
W., Jimenez, J. L., McDonald, A. G., Nemitz, E., Canagaratna, M. R., and
Jayne, J. T.: Quantitative sampling using an Aerodyne aerosol mass
spectrometer 2. Measurements of fine particulate chemical composition in two
UK cities, J. Geophys. Res.-Atmos., 108, 4091, <ext-link xlink:href="https://doi.org/10.1029/2002JD002359" ext-link-type="DOI">10.1029/2002JD002359</ext-link>,
2003a.</mixed-citation></ref>
      <ref id="bib1.bib8"><label>8</label><mixed-citation>Allan, J. D., Jimenez, J. L., Williams, P. I., Alfarra, M. R., Bower, K. N.,
Jayne, J. T., Coe, H., and Worsnop, D. R.: Quantitative sampling using an
Aerodyne aerosol mass spectrometer 1. Techniques of data interpretation and
error analysis, J. Geophys. Res.-Atmos., 108, 4090,
<ext-link xlink:href="https://doi.org/10.1029/2002JD002358" ext-link-type="DOI">10.1029/2002JD002358</ext-link>, 2003b.</mixed-citation></ref>
      <ref id="bib1.bib9"><label>9</label><mixed-citation>
Allan, J. D., Delia, A. E., Coe, H., Bower, K. N., Alfarra, M. R., Jimenez,
J. L., Middlebrook, A. M., Drewnick, F., Onasch, T. B., and Canagaratna, M.
R.: A generalised method for the extraction of chemically resolved mass
spectra from Aerodyne aerosol mass spectrometer data, J. Aerosol Sci., 35,
909–922, 2004.</mixed-citation></ref>
      <ref id="bib1.bib10"><label>10</label><mixed-citation>Allan, J. D., Alfarra, M. R., Bower, K. N., Coe, H., Jayne, J. T., Worsnop,
D. R., Aalto, P. P., Kulmala, M., Hyötyläinen, T., Cavalli, F., and
Laaksonen, A.: Size and composition measurements of background aerosol and
new particle growth in a Finnish forest<?pagebreak page3668?> during QUEST 2 using an Aerodyne
Aerosol Mass Spectrometer, Atmos. Chem. Phys., 6, 315–327,
<ext-link xlink:href="https://doi.org/10.5194/acp-6-315-2006" ext-link-type="DOI">10.5194/acp-6-315-2006</ext-link>, 2006.</mixed-citation></ref>
      <ref id="bib1.bib11"><label>11</label><mixed-citation>Arthur, D. and Vassilvitskii, S.: <inline-formula><mml:math id="M345" display="inline"><mml:mi>k</mml:mi></mml:math></inline-formula>-means<inline-formula><mml:math id="M346" display="inline"><mml:mrow><mml:mo>+</mml:mo><mml:mo>+</mml:mo></mml:mrow></mml:math></inline-formula>: The advantages of careful
seeding, Proceedings of the eighteenth annual ACM-SIAM symposium on Discrete
algorithms, New Orleans, Louisiana, USA, 7–9 January 2007, 1027–1035, 2007.</mixed-citation></ref>
      <ref id="bib1.bib12"><label>12</label><mixed-citation>Bahreini, R., Keywood, M. D., Ng, N. L., Varutbangkul, V., Gao, S., Flagan,
R. C., Seinfeld, J. H., Worsnop, D. R., and Jimenez, J. L.: Measurements of
secondary organic aerosol from oxidation of cycloalkenes, terpenes, and
m-xylene using an Aerodyne aerosol mass spectrometer, Environ. Sci. Technol.,
39, 5674–5688, <ext-link xlink:href="https://doi.org/10.1021/es048061a" ext-link-type="DOI">10.1021/es048061a</ext-link>, 2005.</mixed-citation></ref>
      <ref id="bib1.bib13"><label>13</label><mixed-citation>
Ball, G. H. and Hall, D. J.: ISODATA, a novel method of data analysis and
pattern classification, DTIC Document, Technical report, Stanford research
institute, Menlo Park, CA, USA, 1965.</mixed-citation></ref>
      <ref id="bib1.bib14"><label>14</label><mixed-citation>Berkemeier, T., Ammann, M., Mentel, T. F., Pöschl, U., and Shiraiwa, M.:
Organic nitrate contribution to new particle formation and growth in
secondary organic aerosols from <inline-formula><mml:math id="M347" display="inline"><mml:mi mathvariant="italic">α</mml:mi></mml:math></inline-formula>-pinene ozonolysis, Environ. Sci.
Technol., 50, 6334–6342, 2016.</mixed-citation></ref>
      <ref id="bib1.bib15"><label>15</label><mixed-citation>
Bilde, M., Barsanti, K., Booth, M., Cappa, C. D., Donahue, N. M.,
Emanuelsson, E. U., McFiggans, G., Krieger, U. K., Marcolli, C., and Topping,
D.: Saturation vapor pressures and transition enthalpies of low-volatility
organic molecules of atmospheric relevance: from dicarboxylic acids to
complex mixtures, Chem. Rev., 115, 4115–4156, 2015.</mixed-citation></ref>
      <ref id="bib1.bib16"><label>16</label><mixed-citation>
Brown, S. G., Eberly, S., Paatero, P., and Norris, G. A.: Methods for
estimating uncertainty in PMF solutions: Examples with ambient air and water
quality data and guidance on reporting PMF results, Sci. Total Environ., 518,
626–635, 2015.</mixed-citation></ref>
      <ref id="bib1.bib17"><label>17</label><mixed-citation>
Burns, J. A. and Whitesides, G. M.: Feed-forward neural networks in
chemistry: mathematical systems for classification and pattern recognition,
Chem. Rev., 93, 2583–2601, 1993.</mixed-citation></ref>
      <ref id="bib1.bib18"><label>18</label><mixed-citation>Canagaratna, M. R., Jayne, J. T., Ghertner, D. A., Herndon, S., Shi, Q.,
Jimenez, J. L., Silva, P. J., Williams, P., Lanni, T., Drewnick, F.,
Demerjian, K. L., Kolb, C. E., and Worsnop, D. R.: Chase studies of
particulate emissions from in-use New York City vehicles, Aerosol Sci. Tech.,
38, 555–573, <ext-link xlink:href="https://doi.org/10.1080/02786820490465504" ext-link-type="DOI">10.1080/02786820490465504</ext-link>, 2004.</mixed-citation></ref>
      <ref id="bib1.bib19"><label>19</label><mixed-citation>Canagaratna, M. R., Jayne, J. T., Jimenez, J. L., Allan, J. D., Alfarra, M.
R., Zhang, Q., Onasch, T. B., Drewnick, F., Coe, H., Middlebrook, A., Delia,
A., Williams, L. R., Trimborn, A. M., Northway, M. J., DeCarlo, P. F., Kolb,
C. E., Davidovits, P., and Worsnop, D. R.: Chemical and microphysical
characterization of ambient aerosols with the aerodyne aerosol mass
spectrometer, Mass Spectrom. Rev., 26, 185–222, <ext-link xlink:href="https://doi.org/10.1002/mas.20115" ext-link-type="DOI">10.1002/mas.20115</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib20"><label>20</label><mixed-citation>Canonaco, F., Crippa, M., Slowik, J. G., Baltensperger, U., and
Prévôt, A. S. H.: SoFi, an IGOR-based interface for the efficient use
of the generalized multilinear engine (ME-2) for the source apportionment:
ME-2 application to aerosol mass spectrometer data, Atmos. Meas. Tech., 6,
3649–3661, <ext-link xlink:href="https://doi.org/10.5194/amt-6-3649-2013" ext-link-type="DOI">10.5194/amt-6-3649-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib21"><label>21</label><mixed-citation>Canonaco, F., Slowik, J. G., Baltensperger, U., and Prévôt, A. S. H.:
Seasonal differences in oxygenated organic aerosol composition: implications
for emissions sources and factor analysis, Atmos. Chem. Phys., 15,
6993–7002, <ext-link xlink:href="https://doi.org/10.5194/acp-15-6993-2015" ext-link-type="DOI">10.5194/acp-15-6993-2015</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib22"><label>22</label><mixed-citation>Chirico, R., DeCarlo, P. F., Heringa, M. F., Tritscher, T., Richter, R.,
Prévôt, A. S. H., Dommen, J., Weingartner, E., Wehrle, G., Gysel, M.,
Laborde, M., and Baltensperger, U.: Impact of aftertreatment devices on
primary emissions and secondary organic aerosol formation potential from
in-use diesel vehicles: results from smog chamber experiments, Atmos. Chem.
Phys., 10, 11545–11563, <ext-link xlink:href="https://doi.org/10.5194/acp-10-11545-2010" ext-link-type="DOI">10.5194/acp-10-11545-2010</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib23"><label>23</label><mixed-citation>Corrigan, A. L., Russell, L. M., Takahama, S., Äijälä, M., Ehn,
M., Junninen, H., Rinne, J., Petäjä, T., Kulmala, M., Vogel, A. L.,
Hoffmann, T., Ebben, C. J., Geiger, F. M., Chhabra, P., Seinfeld, J. H.,
Worsnop, D. R., Song, W., Auld, J., and Williams, J.: Biogenic and biomass
burning organic aerosol in a boreal forest at Hyytiälä, Finland,
during HUMPPA-COPEC 2010, Atmos. Chem. Phys., 13, 12233–12256,
<ext-link xlink:href="https://doi.org/10.5194/acp-13-12233-2013" ext-link-type="DOI">10.5194/acp-13-12233-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib24"><label>24</label><mixed-citation>Crippa, M., DeCarlo, P. F., Slowik, J. G., Mohr, C., Heringa, M. F., Chirico,
R., Poulain, L., Freutel, F., Sciare, J., Cozic, J., Di Marco, C. F.,
Elsasser, M., Nicolas, J. B., Marchand, N., Abidi, E., Wiedensohler, A.,
Drewnick, F., Schneider, J., Borrmann, S., Nemitz, E., Zimmermann, R.,
Jaffrezo, J.-L., Prévôt, A. S. H., and Baltensperger, U.: Wintertime
aerosol chemical composition and source apportionment of the organic fraction
in the metropolitan area of Paris, Atmos. Chem. Phys., 13, 961–981,
<ext-link xlink:href="https://doi.org/10.5194/acp-13-961-2013" ext-link-type="DOI">10.5194/acp-13-961-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib25"><label>25</label><mixed-citation>Crippa, M., Canonaco, F., Lanz, V. A., Äijälä, M., Allan, J. D.,
Carbone, S., Capes, G., Ceburnis, D., Dall'Osto, M., Day, D. A., DeCarlo, P.
F., Ehn, M., Eriksson, A., Freney, E., Hildebrandt Ruiz, L., Hillamo, R.,
Jimenez, J. L., Junninen, H., Kiendler-Scharr, A., Kortelainen, A.-M.,
Kulmala, M., Laaksonen, A., Mensah, A. A., Mohr, C., Nemitz, E., O'Dowd, C.,
Ovadnevaite, J., Pandis, S. N., Petäjä, T., Poulain, L., Saarikoski,
S., Sellegri, K., Swietlicki, E., Tiitta, P., Worsnop, D. R., Baltensperger,
U., and Prévôt, A. S. H.: Organic aerosol components derived from 25
AMS data sets across Europe using a consistent ME-2 based source
apportionment approach, Atmos. Chem. Phys., 14, 6159–6176,
<ext-link xlink:href="https://doi.org/10.5194/acp-14-6159-2014" ext-link-type="DOI">10.5194/acp-14-6159-2014</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib26"><label>26</label><mixed-citation>Cubison, M. J., Ortega, A. M., Hayes, P. L., Farmer, D. K., Day, D., Lechner,
M. J., Brune, W. H., Apel, E., Diskin, G. S., Fisher, J. A., Fuelberg, H. E.,
Hecobian, A., Knapp, D. J., Mikoviny, T., Riemer, D., Sachse, G. W.,
Sessions, W., Weber, R. J., Weinheimer, A. J., Wisthaler, A., and Jimenez, J.
L.: Effects of aging on organic aerosol from open biomass burning smoke in
aircraft and laboratory studies, Atmos. Chem. Phys., 11, 12049–12064,
<ext-link xlink:href="https://doi.org/10.5194/acp-11-12049-2011" ext-link-type="DOI">10.5194/acp-11-12049-2011</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib27"><label>27</label><mixed-citation>Daellenbach, K. R., Stefenelli, G., Bozzetti, C., Vlachou, A., Fermo, P.,
Gonzalez, R., Piazzalunga, A., Colombi, C., Canonaco, F., Hueglin, C.,
Kasper-Giebl, A., Jaffrezo, J.-L., Bianchi, F., Slowik, J. G., Baltensperger,
U., El-Haddad, I., and Prévôt, A. S. H.: Long-term chemical analysis
and organic aerosol source apportionment at nine sites in central Europe:
source identification and uncertainty assessment, Atmos. Chem. Phys., 17,
13265–13282, <ext-link xlink:href="https://doi.org/10.5194/acp-17-13265-2017" ext-link-type="DOI">10.5194/acp-17-13265-2017</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib28"><label>28</label><mixed-citation>Drewnick, F., Hings, S. S., DeCarlo, P., Jayne, J. T., Gonin, M., Fuhrer, K.,
Weimer, S., Jimenez, J. L., Demerjian, K. L., Borrmann, S., and Worsnop, D.
R.: A new time-of-flight aerosol mass spectrometer (TOF-AMS) –<?pagebreak page3669?> Instrument
description and first field deployment, Aerosol Sci. Tech., 39, 637–658,
<ext-link xlink:href="https://doi.org/10.1080/02786820500182040" ext-link-type="DOI">10.1080/02786820500182040</ext-link>, 2005.</mixed-citation></ref>
      <ref id="bib1.bib29"><label>29</label><mixed-citation>Drewnick, F., Diesch, J.-M., Faber, P., and Borrmann, S.: Aerosol mass
spectrometry: particle–vaporizer interactions and their consequences for the
measurements, Atmos. Meas. Tech., 8, 3811–3830,
<ext-link xlink:href="https://doi.org/10.5194/amt-8-3811-2015" ext-link-type="DOI">10.5194/amt-8-3811-2015</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib30"><label>30</label><mixed-citation>Duplissy, J., DeCarlo, P. F., Dommen, J., Alfarra, M. R., Metzger, A.,
Barmpadimos, I., Prevot, A. S. H., Weingartner, E., Tritscher, T., Gysel, M.,
Aiken, A. C., Jimenez, J. L., Canagaratna, M. R., Worsnop, D. R., Collins, D.
R., Tomlinson, J., and Baltensperger, U.: Relating hygroscopicity and
composition of organic aerosol particulate matter, Atmos. Chem. Phys., 11,
1155–1165, <ext-link xlink:href="https://doi.org/10.5194/acp-11-1155-2011" ext-link-type="DOI">10.5194/acp-11-1155-2011</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib31"><label>31</label><mixed-citation>Elsasser, M., Crippa, M., Orasche, J., DeCarlo, P. F., Oster, M., Pitz, M.,
Cyrys, J., Gustafson, T. L., Pettersson, J. B. C., Schnelle-Kreis, J.,
Prévôt, A. S. H., and Zimmermann, R.: Organic molecular markers and
signature from wood combustion particles in winter ambient aerosols: aerosol
mass spectrometer (AMS) and high time-resolved GC-MS measurements in
Augsburg, Germany, Atmos. Chem. Phys., 12, 6113–6128,
<ext-link xlink:href="https://doi.org/10.5194/acp-12-6113-2012" ext-link-type="DOI">10.5194/acp-12-6113-2012</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib32"><label>32</label><mixed-citation>Farmer, D. K., Matsunaga, A., Docherty, K. S., Surratt, J. D., Seinfeld, J.
H., Ziemann, P. J., and Jimenez, J. L.: Response of an aerosol mass
spectrometer to organonitrates and organosulfates and implications for
atmospheric chemistry, P. Natl. Acad. Sci. USA, 107, 6670–6675,
<ext-link xlink:href="https://doi.org/10.1073/pnas.0912340107" ext-link-type="DOI">10.1073/pnas.0912340107</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib33"><label>33</label><mixed-citation>
Fortier, J. and Solomon, H.: Clustering procedures, in: Multivariate
Analysis, edited by: Krishnaiah, P. R., 493–506, Academic Press, New York,
USA, 1966.</mixed-citation></ref>
      <ref id="bib1.bib34"><label>34</label><mixed-citation>Fountoukis, C. and Nenes, A.: ISORROPIA II: a computationally efficient
thermodynamic equilibrium model for
<inline-formula><mml:math id="M348" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">K</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M349" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">Ca</mml:mi><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M350" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">Mg</mml:mi><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M351" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NH</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M352" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">Na</mml:mi><mml:mo>+</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M353" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">SO</mml:mi><mml:mn mathvariant="normal">4</mml:mn><mml:mrow><mml:mn mathvariant="normal">2</mml:mn><mml:mo>-</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M354" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">NO</mml:mi><mml:mn mathvariant="normal">3</mml:mn><mml:mo>-</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M355" display="inline"><mml:mrow class="chem"><mml:msup><mml:mi mathvariant="normal">Cl</mml:mi><mml:mo>-</mml:mo></mml:msup></mml:mrow></mml:math></inline-formula>–<inline-formula><mml:math id="M356" display="inline"><mml:mrow class="chem"><mml:msub><mml:mi mathvariant="normal">H</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msub><mml:mi mathvariant="normal">O</mml:mi></mml:mrow></mml:math></inline-formula>
aerosols, Atmos. Chem. Phys., 7, 4639–4659,
<ext-link xlink:href="https://doi.org/10.5194/acp-7-4639-2007" ext-link-type="DOI">10.5194/acp-7-4639-2007</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib35"><label>35</label><mixed-citation>Freutel, F., Drewnick, F., Schneider, J., Klimach, T., and Borrmann, S.:
Quantitative single-particle analysis with the Aerodyne aerosol mass
spectrometer: development of a new classification algorithm and its
application to field data, Atmos. Meas. Tech., 6, 3131–3145,
<ext-link xlink:href="https://doi.org/10.5194/amt-6-3131-2013" ext-link-type="DOI">10.5194/amt-6-3131-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib36"><label>36</label><mixed-citation>
Friedlander, S. K.: Chemical element balances and identification of air
pollution sources, Environ. Sci. Technol., 7, 235–240, 1973.</mixed-citation></ref>
      <ref id="bib1.bib37"><label>37</label><mixed-citation>
Gasteiger, J. and Zupan, J.: Neural networks in chemistry, Angew. Chem. Int.
Edit., 32, 503–527, 1993.</mixed-citation></ref>
      <ref id="bib1.bib38"><label>38</label><mixed-citation>
Gordon, G. E.: Receptor models, Environ. Sci. Technol., 22, 1132–1142, 1988.</mixed-citation></ref>
      <ref id="bib1.bib39"><label>39</label><mixed-citation>Gysel, M., Crosier, J., Topping, D. O., Whitehead, J. D., Bower, K. N.,
Cubison, M. J., Williams, P. I., Flynn, M. J., McFiggans, G. B., and Coe, H.:
Closure study between chemical composition and hygroscopic growth of aerosol
particles during TORCH2, Atmos. Chem. Phys., 7, 6131–6144,
<ext-link xlink:href="https://doi.org/10.5194/acp-7-6131-2007" ext-link-type="DOI">10.5194/acp-7-6131-2007</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib40"><label>40</label><mixed-citation>Hao, L. Q., Kortelainen, A., Romakkaniemi, S., Portin, H., Jaatinen, A.,
Leskinen, A., Komppula, M., Miettinen, P., Sueper, D., Pajunoja, A., Smith,
J. N., Lehtinen, K. E. J., Worsnop, D. R., Laaksonen, A., and Virtanen, A.:
Atmospheric submicron aerosol composition and particulate organic nitrate
formation in a boreal forestland–urban mixed region, Atmos. Chem. Phys., 14,
13483–13495, <ext-link xlink:href="https://doi.org/10.5194/acp-14-13483-2014" ext-link-type="DOI">10.5194/acp-14-13483-2014</ext-link>, 2014.</mixed-citation></ref>
      <ref id="bib1.bib41"><label>41</label><mixed-citation>
Hari, P. and Kulmala, M.: Station for measuring ecosystem-atmosphere
relations (SMEAR II), Boreal Environ. Res., 10, 315–322, 2005.</mixed-citation></ref>
      <ref id="bib1.bib42"><label>42</label><mixed-citation>
Haynes, W. M.: CRC handbook of chemistry and physics, CRC press, Boca Raton,
FL, USA, 2014.</mixed-citation></ref>
      <ref id="bib1.bib43"><label>43</label><mixed-citation>Hersey, S. P., Craven, J. S., Schilling, K. A., Metcalf, A. R., Sorooshian,
A., Chan, M. N., Flagan, R. C., and Seinfeld, J. H.: The Pasadena Aerosol
Characterization Observatory (PACO): chemical and physical analysis of the
Western Los Angeles basin aerosol, Atmos. Chem. Phys., 11, 7417–7443,
<ext-link xlink:href="https://doi.org/10.5194/acp-11-7417-2011" ext-link-type="DOI">10.5194/acp-11-7417-2011</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib44"><label>44</label><mixed-citation>
Hoffmann, D., Tilgner, A., Iinuma, Y., and Herrmann, H.: Atmospheric
stability of levoglucosan: a detailed laboratory and modeling study, Environ.
Sci. Technol., 44, 694–699, 2009.</mixed-citation></ref>
      <ref id="bib1.bib45"><label>45</label><mixed-citation>Hong, J., Äijälä, M., Häme, S. A. K., Hao, L., Duplissy, J.,
Heikkinen, L. M., Nie, W., Mikkilä, J., Kulmala, M., Prisle, N. L.,
Virtanen, A., Ehn, M., Paasonen, P., Worsnop, D. R., Riipinen, I.,
Petäjä, T., and Kerminen, V.-M.: Estimates of the organic aerosol
volatility in a boreal forest using two independent methods, Atmos. Chem.
Phys., 17, 4387–4399, <ext-link xlink:href="https://doi.org/10.5194/acp-17-4387-2017" ext-link-type="DOI">10.5194/acp-17-4387-2017</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib46"><label>46</label><mixed-citation>
Hopke, P. K.: Receptor modeling for air quality management, Elsevier,
Amsterdam, the Netherlands, 1991.</mixed-citation></ref>
      <ref id="bib1.bib47"><label>47</label><mixed-citation>
Hopke, P. K.: Review of receptor modeling methods for source apportionment,
J. Air Waste Manage., 66, 237–259, 2016.</mixed-citation></ref>
      <ref id="bib1.bib48"><label>48</label><mixed-citation>Horai, H., Arita, M., Kanaya, S., Nihei, Y., Ikeda, T., Suwa, K., Ojima, Y.,
Tanaka, K., Tanaka, S., Aoshima, K., Oda, Y., Kakazu, Y., Kusano, M., Tohge,
T., Matsuda, F., Sawada, Y., Hirai, M. Y., Nakanishi, H., Ikeda, K., Akimoto,
N., Maoka, T., Takahashi, H., Ara, T., Sakurai, N., Suzuki, H., Shibata, D.,
Neumann, S., Iida, T., Tanaka, K., Funatsu, K., Matsuura, F., Soga, T.,
Taguchi, R., Saito, K., and Nishioka, T.: MassBank: a public repository for
sharing mass spectral data for life sciences, J. Mass Spectrom., 45,
703–714, <ext-link xlink:href="https://doi.org/10.1002/jms.1777" ext-link-type="DOI">10.1002/jms.1777</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib49"><label>49</label><mixed-citation>Irei, S., Shimono, A., Hikida, T., Kuramoto, K., Suzuki, Y., and Takami, A.:
Qualitative evaluation of <inline-formula><mml:math id="M357" display="inline"><mml:mrow><mml:mi>m</mml:mi><mml:mo>/</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:math></inline-formula> 85, 87, and 133 signals in organic aerosol
mass spectra of fly ash produced by coal combustion, Aerosol Air Qual. Res.,
14, 406–412, 2014.</mixed-citation></ref>
      <ref id="bib1.bib50"><label>50</label><mixed-citation>
Jain, A. K.: Data clustering: 50 years beyond K-means, Pattern Recogn. Lett.,
31, 651–666, 2010.</mixed-citation></ref>
      <ref id="bib1.bib51"><label>51</label><mixed-citation>Jimenez, J. L., Canagaratna, M. R., Donahue, N. M., Prevot, A. S., Zhang, Q.,
Kroll, J. H., DeCarlo, P. F., Allan, J. D., Coe, H., Ng, N. L., Aiken, A. C.,
Docherty, K. S., Ulbrich, I. M., Grieshop, A. P., Robinson, A. L., Duplissy,
J., Smith, J. D., Wilson, K. R., Lanz, V. A., Hueglin, C., Sun, Y. L., Tian,
J., Laaksonen, A., Raatikainen, T., Rautiainen, J., Vaattovaara, P., Ehn, M.,
Kulmala, M., Tomlinson, J. M., Collins, D. R., Cubison, M. J., Dunlea, E. J.,
Huffman, J. A., Onasch, T. B., Alfarra, M. R., Williams, P. I., Bower, K.,
Kondo, Y., Schneider, J., Drewnick, F., Borrmann, S., Weimer, S., Demerjian,
K., Salcedo, D., Cottrell, L., Griffin, R., Takami, A., Miyoshi, T.,
Hatakeyama, S., Shimono, A., Sun, J. Y., Zhang, Y. M., Dzepina, K., Kimmel,
J. R., Sueper, D., Jayne, J. T., Herndon, S. C., Trimborn, A. M., Williams,
L. R., Wood, E. C., Middlebrook, A. M., Kolb, C. E., Baltensperger, U., and
Worsnop, D. R.: Evolution of organic aerosols in the atmosphere, Science,
326, 1525–1529, <ext-link xlink:href="https://doi.org/10.1126/science.1180353" ext-link-type="DOI">10.1126/science.1180353</ext-link>, 2009.</mixed-citation></ref>
      <?pagebreak page3670?><ref id="bib1.bib52"><label>52</label><mixed-citation>
Kiendler-Scharr, A., Mensah, A. A., Friese, E., Topping, D., Nemitz, E.,
Prevot, A., Äijälä, M., Allan, J., Canonaco, F., and Canagaratna,
M.: Ubiquity of organic nitrates from nighttime chemistry in the European
submicron aerosol, Geophys. Res. Lett., 43, 7735–7744, 2016.</mixed-citation></ref>
      <ref id="bib1.bib53"><label>53</label><mixed-citation>Kim, S., Koo, I., Wei, X., and Zhang, X.: A method of finding optimal weight
factors for compound identification in gas chromatography-mass spectrometry,
Bioinformatics, 28, 1158–1163, <ext-link xlink:href="https://doi.org/10.1093/bioinformatics/bts083" ext-link-type="DOI">10.1093/bioinformatics/bts083</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib54"><label>54</label><mixed-citation>
Kowalski, B. R.: Measurement analysis by pattern recognition, Anal. Chem.,
47, 1152A–1162a, 1975.</mixed-citation></ref>
      <ref id="bib1.bib55"><label>55</label><mixed-citation>
Kroll, J. H. and Seinfeld, J. H.: Chemistry of secondary organic aerosol:
Formation and evolution of low-volatility organics in the atmosphere, Atmos.
Environ., 42, 3593–3624, 2008.</mixed-citation></ref>
      <ref id="bib1.bib56"><label>56</label><mixed-citation>
Kulmala, M., Rannik, Ü., Pirjola, L., Dal Maso, M., Karimäki, J.,
Asmi, A., Jäppinen, A., Karhu, V., Korhonen, H., and Malvikko, S.-P.:
Characterization of atmospheric trace gas and aerosol concentrations at
forest sites in southern and northern Finland using back trajectories, Boreal
Environ. Res., 5, 315–336, 2000.</mixed-citation></ref>
      <ref id="bib1.bib57"><label>57</label><mixed-citation>Kulmala, M., Asmi, A., Lappalainen, H. K., Carslaw, K. S., Pöschl, U.,
Baltensperger, U., Hov, Ø., Brenquier, J.-L., Pandis, S. N., Facchini, M.
C., Hansson, H.-C., Wiedensohler, A., and O'Dowd, C. D.: Introduction:
European Integrated Project on Aerosol Cloud Climate and Air Quality
interactions (EUCAARI) – integrating aerosol research from nano to global
scales, Atmos. Chem. Phys., 9, 2825–2841,
<ext-link xlink:href="https://doi.org/10.5194/acp-9-2825-2009" ext-link-type="DOI">10.5194/acp-9-2825-2009</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bib58"><label>58</label><mixed-citation>Kulmala, M., Asmi, A., Lappalainen, H. K., Baltensperger, U., Brenguier,
J.-L., Facchini, M. C., Hansson, H.-C., Hov, Ø., O'Dowd, C. D.,
Pöschl, U., Wiedensohler, A., Boers, R., Boucher, O., de Leeuw, G.,
Denier van der Gon, H. A. C., Feichter, J., Krejci, R., Laj, P., Lihavainen,
H., Lohmann, U., McFiggans, G., Mentel, T., Pilinis, C., Riipinen, I.,
Schulz, M., Stohl, A., Swietlicki, E., Vignati, E., Alves, C., Amann, M.,
Ammann, M., Arabas, S., Artaxo, P., Baars, H., Beddows, D. C. S.,
Bergström, R., Beukes, J. P., Bilde, M., Burkhart, J. F., Canonaco, F.,
Clegg, S. L., Coe, H., Crumeyrolle, S., D'Anna, B., Decesari, S., Gilardoni,
S., Fischer, M., Fjaeraa, A. M., Fountoukis, C., George, C., Gomes, L.,
Halloran, P., Hamburger, T., Harrison, R. M., Herrmann, H., Hoffmann, T.,
Hoose, C., Hu, M., Hyvärinen, A., Hõrrak, U., Iinuma, Y., Iversen,
T., Josipovic, M., Kanakidou, M., Kiendler-Scharr, A., Kirkevåg, A.,
Kiss, G., Klimont, Z., Kolmonen, P., Komppula, M., Kristjánsson, J.-E.,
Laakso, L., Laaksonen, A., Labonnote, L., Lanz, V. A., Lehtinen, K. E. J.,
Rizzo, L. V., Makkonen, R., Manninen, H. E., McMeeking, G., Merikanto, J.,
Minikin, A., Mirme, S., Morgan, W. T., Nemitz, E., O'Donnell, D., Panwar, T.
S., Pawlowska, H., Petzold, A., Pienaar, J. J., Pio, C., Plass-Duelmer, C.,
Prévôt, A. S. H., Pryor, S., Reddington, C. L., Roberts, G.,
Rosenfeld, D., Schwarz, J., Seland, Ø., Sellegri, K., Shen, X. J.,
Shiraiwa, M., Siebert, H., Sierau, B., Simpson, D., Sun, J. Y., Topping, D.,
Tunved, P., Vaattovaara, P., Vakkari, V., Veefkind, J. P., Visschedijk, A.,
Vuollekoski, H., Vuolo, R., Wehner, B., Wildt, J., Woodward, S., Worsnop, D.
R., van Zadelhoff, G.-J., Zardini, A. A., Zhang, K., van Zyl, P. G.,
Kerminen, V.-M., S Carslaw, K., and Pandis, S. N.: General overview: European
Integrated project on Aerosol Cloud Climate and Air Quality interactions
(EUCAARI) – integrating aerosol research from nano to global scales, Atmos.
Chem. Phys., 11, 13061–13143, <ext-link xlink:href="https://doi.org/10.5194/acp-11-13061-2011" ext-link-type="DOI">10.5194/acp-11-13061-2011</ext-link>,
2011.</mixed-citation></ref>
      <ref id="bib1.bib59"><label>59</label><mixed-citation>Lanz, V. A., Alfarra, M. R., Baltensperger, U., Buchmann, B., Hueglin, C.,
and Prévôt, A. S. H.: Source apportionment of submicron organic
aerosols at an urban site by factor analytical modelling of aerosol mass
spectra, Atmos. Chem. Phys., 7, 1503–1522,
<ext-link xlink:href="https://doi.org/10.5194/acp-7-1503-2007" ext-link-type="DOI">10.5194/acp-7-1503-2007</ext-link>, 2007a.</mixed-citation></ref>
      <ref id="bib1.bib60"><label>60</label><mixed-citation>
Lanz, V. A., Alfarra, M. R., Baltensperger, U., Buchmann, B., Hueglin, C.,
Szidat, S., Wehrli, M. N., Wacker, L., Weimer, S., and Caseiro, A.: Source
attribution of submicron organic aerosols during wintertime inversions by
advanced factor analysis of aerosol mass spectra, Environ. Sci. Technol., 42,
214–220, 2007b.</mixed-citation></ref>
      <ref id="bib1.bib61"><label>61</label><mixed-citation>
Lee, B. H., Mohr, C., Lopez-Hilfiker, F. D., Lutz, A., Hallquist, M., Lee,
L., Romer, P., Cohen, R. C., Iyer, S., and Kurtén, T.: Highly
functionalized organic nitrates in the southeast United States: Contribution
to secondary organic aerosol and reactive nitrogen budgets, P. Natl. Acad.
Sci. USA, 113, 1516–1521, 2016.</mixed-citation></ref>
      <ref id="bib1.bib62"><label>62</label><mixed-citation>Li, J., Pósfai, M., Hobbs, P. V., and Buseck, P. R.: Individual aerosol
particles from biomass burning in southern Africa: 2. Compositions and aging
of inorganic particles, J. Geophys. Res.-Atmos., 108, 8484,
<ext-link xlink:href="https://doi.org/10.1029/2002JD002310" ext-link-type="DOI">10.1029/2002JD002310</ext-link>, 2003.</mixed-citation></ref>
      <ref id="bib1.bib63"><label>63</label><mixed-citation>Liang, Z., Chen, L., Alam, M. S., Rezaei, S. Z., Stark, C., Xu, H., and
Harrison, R. M.: Comprehensive chemical characterization of lubricating oils
used in modern vehicular engines utilizing GC<inline-formula><mml:math id="M358" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula>GC-TOFMS, Fuel, 220,
792–799, 2018.</mixed-citation></ref>
      <ref id="bib1.bib64"><label>64</label><mixed-citation>
Lindon, J. C., Tranter, G. E., and Koppenaal, D.: Encyclopedia of
spectroscopy and spectrometry, Academic Press, San Diego, USA, 2016.</mixed-citation></ref>
      <ref id="bib1.bib65"><label>65</label><mixed-citation>
Liu, P. S., Deng, R., Smith, K. A., Williams, L. R., Jayne, J. T.,
Canagaratna, M. R., Moore, K., Onasch, T. B., Worsnop, D. R., and Deshler,
T.: Transmission efficiency of an aerodynamic focusing lens system:
Comparison of model calculations and laboratory measurements for the Aerodyne
Aerosol Mass Spectrometer, Aerosol Sci. Tech., 41, 721–733, 2007.</mixed-citation></ref>
      <ref id="bib1.bib66"><label>66</label><mixed-citation>
MacQueen, J.: Some methods for classification and analysis of multivariate
observations, Proceedings of the fifth Berkeley symposium on mathematical
statistics and probability, 21 June–18 July 1965 and 27 December
1965–7 January 1966, Statistical Laboratory of the University of California,
Berkeley, USA, 281–297, 1967.</mixed-citation></ref>
      <ref id="bib1.bib67"><label>67</label><mixed-citation>Mclafferty, F. W.: Mass Spectrometric Analysis – Molecular Rearrangements,
Anal. Chem., 31, 82–87, <ext-link xlink:href="https://doi.org/10.1021/ac60145a015" ext-link-type="DOI">10.1021/ac60145a015</ext-link>, 1959.</mixed-citation></ref>
      <ref id="bib1.bib68"><label>68</label><mixed-citation>
McLafferty, F. W. and Turecek, F.: Interpretation of mass spectra, University
science books, Mill Valley, CA, USA, 1993.</mixed-citation></ref>
      <ref id="bib1.bib69"><label>69</label><mixed-citation>Mcquitty, L. L.: Similarity Analysis by Reciprocal Pairs for Discrete and
Continuous Data, Educ. Psychol. Meas., 26, 825–831,
<ext-link xlink:href="https://doi.org/10.1177/001316446602600402" ext-link-type="DOI">10.1177/001316446602600402</ext-link>, 1966.</mixed-citation></ref>
      <ref id="bib1.bib70"><label>70</label><mixed-citation>
Miller, M., Friedlander, S., and Hidy, G.: A chemical element balance for the
Pasadena aerosol, in: Aerosols and atmospheric chemistry, Academic Press, New
York, USA, 301–312, 1972.</mixed-citation></ref>
      <ref id="bib1.bib71"><label>71</label><mixed-citation>
Mohr, C., Huffman, A., Cubison, M. J., Aiken, A. C., Docherty, K. S., Kimmel,
J. R., Ulbrich, I. M., Hannigan, M., and Jimenez, J. L.: Characterization of
primary organic aerosol emissions from meat cooking, trash burning, and motor
vehicles with high-resolution aerosol mass spectrometry and comparison with
ambient and chamber observations, Environ. Sci. Technol., 43, 2443–2449,
2009.</mixed-citation></ref>
      <?pagebreak page3671?><ref id="bib1.bib72"><label>72</label><mixed-citation>Mohr, C., DeCarlo, P. F., Heringa, M. F., Chirico, R., Slowik, J. G.,
Richter, R., Reche, C., Alastuey, A., Querol, X., Seco, R., Peñuelas, J.,
Jiménez, J. L., Crippa, M., Zimmermann, R., Baltensperger, U., and
Prévôt, A. S. H.: Identification and quantification of organic
aerosol from cooking and other sources in Barcelona using aerosol mass
spectrometer data, Atmos. Chem. Phys., 12, 1649–1665,
<ext-link xlink:href="https://doi.org/10.5194/acp-12-1649-2012" ext-link-type="DOI">10.5194/acp-12-1649-2012</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib73"><label>73</label><mixed-citation>Murphy, S. M., Sorooshian, A., Kroll, J. H., Ng, N. L., Chhabra, P., Tong,
C., Surratt, J. D., Knipping, E., Flagan, R. C., and Seinfeld, J. H.:
Secondary aerosol formation from atmospheric reactions of aliphatic amines,
Atmos. Chem. Phys., 7, 2313–2337, <ext-link xlink:href="https://doi.org/10.5194/acp-7-2313-2007" ext-link-type="DOI">10.5194/acp-7-2313-2007</ext-link>,
2007.</mixed-citation></ref>
      <ref id="bib1.bib74"><label>74</label><mixed-citation>Ng, N. L., Canagaratna, M. R., Zhang, Q., Jimenez, J. L., Tian, J., Ulbrich,
I. M., Kroll, J. H., Docherty, K. S., Chhabra, P. S., Bahreini, R., Murphy,
S. M., Seinfeld, J. H., Hildebrandt, L., Donahue, N. M., DeCarlo, P. F.,
Lanz, V. A., Prévôt, A. S. H., Dinar, E., Rudich, Y., and Worsnop, D.
R.: Organic aerosol components observed in Northern Hemispheric datasets from
Aerosol Mass Spectrometry, Atmos. Chem. Phys., 10, 4625–4641,
<ext-link xlink:href="https://doi.org/10.5194/acp-10-4625-2010" ext-link-type="DOI">10.5194/acp-10-4625-2010</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib75"><label>75</label><mixed-citation>Ng, N. L., Canagaratna, M. R., Jimenez, J. L., Zhang, Q., Ulbrich, I. M., and
Worsnop, D. R.: Real-time methods for estimating organic component mass
concentrations from aerosol mass spectrometer data, Environ. Sci. Technol.,
45, 910–916, <ext-link xlink:href="https://doi.org/10.1021/es102951k" ext-link-type="DOI">10.1021/es102951k</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib76"><label>76</label><mixed-citation>Niemi, J. V., Saarikoski, S., Aurela, M., Tervahattu, H., Hillamo, R.,
Westphal, D. L., Aarnio, P., Koskentalo, T., Makkonen, U., Vehkamaki, H., and
Kulmala, M.: Long-range transport episodes of fine particles in southern
Finland during 1999–2007, Atmos. Environ., 43, 1255–1264,
<ext-link xlink:href="https://doi.org/10.1016/j.atmosenv.2008.11.022" ext-link-type="DOI">10.1016/j.atmosenv.2008.11.022</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bib77"><label>77</label><mixed-citation>
Orlando, J. J. and Tyndall, G. S.: Laboratory studies of organic peroxy
radical chemistry: an overview with emphasis on recent issues of atmospheric
significance, Chem. Soc. Rev., 41, 6294–6317, 2012.</mixed-citation></ref>
      <ref id="bib1.bib78"><label>78</label><mixed-citation>
Osborne, J. W., Costello, A. B., and Kellow, J. T.: Best practices in
exploratory factor analysis, CreateSpace Independent Publishing Platform,
Charleston, SC, USA, 2014.</mixed-citation></ref>
      <ref id="bib1.bib79"><label>79</label><mixed-citation>Paatero, P.: Least squares formulation of robust non-negative factor
analysis, Chemometr. Intell. Lab., 37, 23–35,
<ext-link xlink:href="https://doi.org/10.1016/S0169-7439(96)00044-5" ext-link-type="DOI">10.1016/S0169-7439(96)00044-5</ext-link>, 1997.</mixed-citation></ref>
      <ref id="bib1.bib80"><label>80</label><mixed-citation>Paatero, P.: The multilinear engine – A table-driven, least squares program
for solving multilinear problems, including the n-way parallel factor
analysis model, J. Comput. Graph. Stat., 8, 854–888, <ext-link xlink:href="https://doi.org/10.2307/1390831" ext-link-type="DOI">10.2307/1390831</ext-link>,
1999.</mixed-citation></ref>
      <ref id="bib1.bib81"><label>81</label><mixed-citation>
Paatero, P.: User's guide for positive matrix factorization programs PMF2 and
PMF3, University of Helsinki, Helsinki, Finland, 2000.</mixed-citation></ref>
      <ref id="bib1.bib82"><label>82</label><mixed-citation>
Paatero, P. and Tapper, U.: Positive matrix factorization: A non-negative
factor model with optimal utilization of error estimates of data values,
Environmetrics, 5, 111–126, 1994.</mixed-citation></ref>
      <ref id="bib1.bib83"><label>83</label><mixed-citation>Patokoski, J., Ruuskanen, T. M., Kajos, M. K., Taipale, R., Rantala, P.,
Aalto, J., Ryyppö, T., Nieminen, T., Hakola, H., and Rinne, J.: Sources
of long-lived atmospheric VOCs at the rural boreal forest site, SMEAR II,
Atmos. Chem. Phys., 15, 13413–13432,
<ext-link xlink:href="https://doi.org/10.5194/acp-15-13413-2015" ext-link-type="DOI">10.5194/acp-15-13413-2015</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib84"><label>84</label><mixed-citation>
Peräkylä, O., Vogt, M., Tikkanen, O.-P., Laurila, T., Kajos, M. K.,
Rantala, P. A., Patokoski, J., Aalto, J., Yli-Juuti, T., and Ehn, M.:
Monoterpenes' oxidation capacity and rate over a boreal forest (suppl. B),
Boreal Environ. Res., 19, 293–310, 2014.</mixed-citation></ref>
      <ref id="bib1.bib85"><label>85</label><mixed-citation>Pieber, S. M., El Haddad, I., Slowik, J. G., Canagaratna, M. R., Jayne, J.
T., Platt, S. M., Bozzetti, C., Daellenbach, K. R., Fröhlich, R., and
Vlachou, A.: Inorganic salt interference on <inline-formula><mml:math id="M359" display="inline"><mml:mrow class="chem"><mml:msubsup><mml:mi mathvariant="normal">CO</mml:mi><mml:mn mathvariant="normal">2</mml:mn><mml:mo>+</mml:mo></mml:msubsup></mml:mrow></mml:math></inline-formula> in aerodyne AMS
and ACSM organic aerosol composition studies, Environ. Sci. Technol., 50,
10494–10503, 2016.</mixed-citation></ref>
      <ref id="bib1.bib86"><label>86</label><mixed-citation>
Rasulev, U. K. and Zandberg, E. Y.: Surface ionization of organic compounds
and its applications, Prog. Surf. Sci., 28, 181–412, 1988.</mixed-citation></ref>
      <ref id="bib1.bib87"><label>87</label><mixed-citation>Rebotier, T. P. and Prather, K. A.: Aerosol time-of-flight mass spectrometry
data analysis: a benchmark of clustering algorithms, Anal. Chim. Acta, 585,
38–54, <ext-link xlink:href="https://doi.org/10.1016/j.aca.2006.12.009" ext-link-type="DOI">10.1016/j.aca.2006.12.009</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib88"><label>88</label><mixed-citation>
Reilly, P. and Wood, R. H.: Prediction of the properties of mixed
electrolytes from measurements on common ion mixtures, J. Phys. Chem., 73,
4292–4297, 1969.</mixed-citation></ref>
      <ref id="bib1.bib89"><label>89</label><mixed-citation>Robinson, N. H., Hamilton, J. F., Allan, J. D., Langford, B., Oram, D. E.,
Chen, Q., Docherty, K., Farmer, D. K., Jimenez, J. L., Ward, M. W., Hewitt,
C. N., Barley, M. H., Jenkin, M. E., Rickard, A. R., Martin, S. T.,
McFiggans, G., and Coe, H.: Evidence for a significant proportion of
Secondary Organic Aerosol from isoprene above a maritime tropical forest,
Atmos. Chem. Phys., 11, 1039–1050, <ext-link xlink:href="https://doi.org/10.5194/acp-11-1039-2011" ext-link-type="DOI">10.5194/acp-11-1039-2011</ext-link>,
2011.</mixed-citation></ref>
      <ref id="bib1.bib90"><label>90</label><mixed-citation>Rousseeuw, P. J.: Silhouettes – a Graphical Aid to the Interpretation and
Validation of Cluster-Analysis, J. Comput. Appl. Math., 20, 53–65,
<ext-link xlink:href="https://doi.org/10.1016/0377-0427(87)90125-7" ext-link-type="DOI">10.1016/0377-0427(87)90125-7</ext-link>, 1987.</mixed-citation></ref>
      <ref id="bib1.bib91"><label>91</label><mixed-citation>Schneider, J., Weimer, S., Drewnick, F., Borrmann, S., Helas, G., Gwaze, P.,
Schmid, O., Andreae, M. O., and Kirchner, U.: Mass spectrometric analysis and
aerodynamic properties of various types of combustion-related aerosol
particles, Int. J. Mass Spectrom., 258, 37–49,
<ext-link xlink:href="https://doi.org/10.1016/j.ijms.2006.07.008" ext-link-type="DOI">10.1016/j.ijms.2006.07.008</ext-link>, 2006.</mixed-citation></ref>
      <ref id="bib1.bib92"><label>92</label><mixed-citation>
Shafizadeh, F.: The chemistry of pyrolysis and combustion, The chemistry of
solid wood, in: Advances in Chemistry Series, edited by: Rowell, R. M.,
Number 207, North American Chemical Society, Washington, D.C., USA, 489–529,
1984.</mixed-citation></ref>
      <ref id="bib1.bib93"><label>93</label><mixed-citation>Sofowote, U. M., Su, Y., Dabek-Zlotorzynska, E., Rastogi, A. K., Brook, J.,
and Hopke, P. K.: Constraining the factor analytical solutions obtained from
multiple-year receptor modeling of ambient PM<inline-formula><mml:math id="M360" display="inline"><mml:msub><mml:mi/><mml:mn mathvariant="normal">2.5</mml:mn></mml:msub></mml:math></inline-formula> data from five
speciation sites in Ontario, Canada, Atmos. Environ., 108, 151–157, 2015.</mixed-citation></ref>
      <ref id="bib1.bib94"><label>94</label><mixed-citation>
Sogacheva, L., Dal Maso, M., Kerminen, V.-M., and Kulmala, M.: Probability of
nucleation events and aerosol particle concentration in different air mass
types arriving at Hyytiälä, southern Finland, based on back
trajectories analysis, Boreal Environ. Res., 10, 479–491, 2005.</mixed-citation></ref>
      <ref id="bib1.bib95"><label>95</label><mixed-citation>Stein, S. E. and Scott, D. R.: Optimization and testing of mass spectral
library search algorithms for compound identification, J. Am. Soc. Mass
Spectrom., 5, 859–866, <ext-link xlink:href="https://doi.org/10.1016/1044-0305(94)87009-8" ext-link-type="DOI">10.1016/1044-0305(94)87009-8</ext-link>, 1994.</mixed-citation></ref>
      <ref id="bib1.bib96"><label>96</label><mixed-citation>
Steinhaus, H.: Sur la division des corp materiels en parties, Bull. Acad.
Polon. Sci., 1, 801–804, 1956.</mixed-citation></ref>
      <ref id="bib1.bib97"><label>97</label><mixed-citation>Sun, Y. L., Zhang, Q., Schwab, J. J., Yang, T., Ng, N. L., and Demerjian, K.
L.: Factor analysis of combined organic and inorganic aerosol mass spectra
from high resolution aerosol mass spectrometer measurements, Atmos. Chem.
Phys., 12, 8537–8551, <ext-link xlink:href="https://doi.org/10.5194/acp-12-8537-2012" ext-link-type="DOI">10.5194/acp-12-8537-2012</ext-link>, 2012.</mixed-citation></ref>
      <?pagebreak page3672?><ref id="bib1.bib98"><label>98</label><mixed-citation>
Swietlicki, E., Hansson, H.-C., Hämeri, K., Svenningsson, B., Massling,
A., McFiggans, G., McMurry, P., Petäjä, T., Tunved, P., and Gysel,
M.: Hygroscopic properties of submicrometer atmospheric aerosol particles
measured with H-TDMA instruments in various environments – a review, Tellus
B, 60, 432–469, 2008.</mixed-citation></ref>
      <ref id="bib1.bib99"><label>99</label><mixed-citation>Takami, A., Miyoshi, T., Shimono, A., Kaneyasu, N., Kato, S., Kajii, Y., and
Hatakeyama, S.: Transport of anthropogenic aerosols from Asia and subsequent
chemical transformation, J. Geophys. Res.-Atmos., 112, D22S31,
<ext-link xlink:href="https://doi.org/10.1029/2006JD008120" ext-link-type="DOI">10.1029/2006JD008120</ext-link>, 2007.</mixed-citation></ref>
      <ref id="bib1.bib100"><label>100</label><mixed-citation>Ulbrich, I. M., Canagaratna, M. R., Zhang, Q., Worsnop, D. R., and Jimenez,
J. L.: Interpretation of organic components from Positive Matrix
Factorization of aerosol mass spectrometric data, Atmos. Chem. Phys., 9,
2891–2918, <ext-link xlink:href="https://doi.org/10.5194/acp-9-2891-2009" ext-link-type="DOI">10.5194/acp-9-2891-2009</ext-link>, 2009.</mixed-citation></ref>
      <ref id="bib1.bib101"><label>101</label><mixed-citation>Vogel, A. L., Äijälä, M., Corrigan, A. L., Junninen, H., Ehn, M.,
Petäjä, T., Worsnop, D. R., Kulmala, M., Russell, L. M., Williams,
J., and Hoffmann, T.: In situ submicron organic aerosol characterization at a
boreal forest research station during HUMPPA-COPEC 2010 using soft and hard
ionization mass spectrometry, Atmos. Chem. Phys., 13, 10933–10950,
<ext-link xlink:href="https://doi.org/10.5194/acp-13-10933-2013" ext-link-type="DOI">10.5194/acp-13-10933-2013</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib102"><label>102</label><mixed-citation>Williams, J., Crowley, J., Fischer, H., Harder, H., Martinez, M.,
Petäjä, T., Rinne, J., Bäck, J., Boy, M., Dal Maso, M., Hakala,
J., Kajos, M., Keronen, P., Rantala, P., Aalto, J., Aaltonen, H., Paatero,
J., Vesala, T., Hakola, H., Levula, J., Pohja, T., Herrmann, F., Auld, J.,
Mesarchaki, E., Song, W., Yassaa, N., Nölscher, A., Johnson, A. M.,
Custer, T., Sinha, V., Thieser, J., Pouvesle, N., Taraborrelli, D., Tang, M.
J., Bozem, H., Hosaynali-Beygi, Z., Axinte, R., Oswald, R., Novelli, A.,
Kubistin, D., Hens, K., Javed, U., Trawny, K., Breitenberger, C., Hidalgo, P.
J., Ebben, C. J., Geiger, F. M., Corrigan, A. L., Russell, L. M., Ouwersloot,
H. G., Vilà-Guerau de Arellano, J., Ganzeveld, L., Vogel, A., Beck, M.,
Bayerle, A., Kampf, C. J., Bertelmann, M., Köllner, F., Hoffmann, T.,
Valverde, J., González, D., Riekkola, M.-L., Kulmala, M., and Lelieveld,
J.: The summertime Boreal forest field measurement intensive
(HUMPPA-COPEC-2010): an overview of meteorological and chemical influences,
Atmos. Chem. Phys., 11, 10599–10618,
<ext-link xlink:href="https://doi.org/10.5194/acp-11-10599-2011" ext-link-type="DOI">10.5194/acp-11-10599-2011</ext-link>, 2011.
</mixed-citation></ref><?xmltex \hack{\newpage}?>
      <ref id="bib1.bib103"><label>103</label><mixed-citation>
Worton, D. R., Isaacman, G., Gentner, D. R., Dallmann, T. R., Chan, A. W.,
Ruehl, C., Kirchstetter, T. W., Wilson, K. R., Harley, R. A., and Goldstein,
A. H.: Lubricating oil dominates primary organic aerosol emissions from motor
vehicles, Environ. Sci. Technol., 48, 3698–3706, 2014.</mixed-citation></ref>
      <ref id="bib1.bib104"><label>104</label><mixed-citation>
Yatavelli, R. L., Mohr, C., Stark, H., Day, D. A., Thompson, S. L.,
Lopez-Hilfiker, F. D., Campuzano-Jost, P., Palm, B. B., Vogel, A. L., and
Hoffmann, T.: Estimating the contribution of organic acids to northern
hemispheric continental organic aerosol, Geophys. Res. Lett., 42, 6084–6090,
2015.</mixed-citation></ref>
      <ref id="bib1.bib105"><label>105</label><mixed-citation>
Ye, Q., Robinson, E. S., Ding, X., Ye, P., Sullivan, R. C., and Donahue, N.
M.: Mixing of secondary organic aerosols versus relative humidity, P. Natl.
Acad. Sci. USA, 113, 12649–12654, 2016.</mixed-citation></ref>
      <ref id="bib1.bib106"><label>106</label><mixed-citation>
Zhang, Q., Alfarra, M. R., Worsnop, D. R., Allan, J. D., Coe, H.,
Canagaratna, M. R., and Jimenez, J. L.: Deconvolution and quantification of
hydrocarbon-like and oxygenated organic aerosols based on aerosol mass
spectrometry, Environ. Sci. Technol., 39, 4938–4952, 2005.</mixed-citation></ref>
      <ref id="bib1.bib107"><label>107</label><mixed-citation>Zhang, Q., Jimenez, J. L., Canagaratna, M. R., Ulbrich, I. M., Ng, N. L.,
Worsnop, D. R., and Sun, Y.: Understanding atmospheric organic aerosols via
factor analysis of aerosol mass spectrometry: a review, Anal. Bioanal. Chem.,
401, 3045–3067, <ext-link xlink:href="https://doi.org/10.1007/s00216-011-5355-y" ext-link-type="DOI">10.1007/s00216-011-5355-y</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib108"><label>108</label><mixed-citation>Zieger, P., Aalto, P. P., Aaltonen, V., Äijälä, M., Backman, J.,
Hong, J., Komppula, M., Krejci, R., Laborde, M., Lampilahti, J., de Leeuw,
G., Pfüller, A., Rosati, B., Tesche, M., Tunved, P.,
Väänänen, R., and Petäjä, T.: Low hygroscopic scattering
enhancement of boreal aerosol and the implications for a columnar optical
closure study, Atmos. Chem. Phys., 15, 7247–7267,
<ext-link xlink:href="https://doi.org/10.5194/acp-15-7247-2015" ext-link-type="DOI">10.5194/acp-15-7247-2015</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib109"><label>109</label><mixed-citation>Zimmermann, R.: Aerosols and health: a challenge for chemical and biological
analysis, Anal. Bioanal. Chem., 407, 5863–5867,
<ext-link xlink:href="https://doi.org/10.1007/s00216-015-8832-x" ext-link-type="DOI">10.1007/s00216-015-8832-x</ext-link>, 2015.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>Constructing a data-driven receptor model for organic and inorganic aerosol – a synthesis analysis of eight mass spectrometric data sets from a boreal forest site</article-title-html>
<abstract-html><p>The interactions between organic and
inorganic aerosol chemical components are integral to understanding and
modelling climate and health-relevant aerosol physicochemical properties,
such as volatility, hygroscopicity, light scattering and toxicity. This study
presents a synthesis analysis for eight data sets, of non-refractory aerosol
composition, measured at a boreal forest site. The measurements, performed
with an aerosol mass spectrometer, cover in total around 9 months over the
course of 3 years. In our statistical analysis, we use the complete organic
and inorganic unit-resolution mass spectra, as opposed to the more common
approach of only including the organic fraction. The analysis is based on
iterative, combined use of (1) data reduction, (2) classification and
(3) scaling tools, producing a data-driven chemical mass balance type of
model capable of describing site-specific aerosol composition. The receptor
model we constructed was able to explain 83±8&thinsp;% of variation in
data, which increased to 96±3&thinsp;% when signals from low
signal-to-noise variables were not considered. The resulting interpretation
of an extensive set of aerosol mass spectrometric data infers seven distinct
aerosol chemical components for a rural boreal forest site: ammonium sulfate
(35±7&thinsp;% of mass), low and semi-volatile oxidised organic aerosols
(27±8&thinsp;% and 12±7&thinsp;%), biomass burning organic aerosol (11±7&thinsp;%), a nitrate-containing organic aerosol type (7±2&thinsp;%),
ammonium nitrate (5±2&thinsp;%), and hydrocarbon-like organic aerosol (3±1&thinsp;%). Some of the additionally observed, rare outlier aerosol types
likely emerge due to surface ionisation effects and likely represent amine
compounds from an unknown source and alkaline metals from emissions of a
nearby district heating plant. Compared to traditional, ion-balance-based
inorganics apportionment schemes for aerosol mass spectrometer data, our
statistics-based method provides an improved, more robust approach, yielding
readily useful information for the modelling of submicron atmospheric
aerosols physical and chemical properties. The results also shed light on the
division between organic and inorganic aerosol types and dynamics of salt
formation in aerosol. Equally importantly, the combined methodology
exemplifies an iterative analysis, using consequent analysis steps by a
combination of statistical methods. Such an approach offers new ways to home
in on physicochemically sensible solutions with minimal need for a priori
information or analyst interference. We therefore suggest that similar
statistics-based approaches offer significant potential for un- or semi-supervised machine-learning applications in future analyses of aerosol
mass spectrometric data.</p></abstract-html>
<ref-html id="bib1.bib1"><label>1</label><mixed-citation>
Äijälä, M., Heikkinen, L., Fröhlich, R., Canonaco, F.,
Prévôt, A. S. H., Junninen, H., Petäjä, T., Kulmala, M.,
Worsnop, D., and Ehn, M.: Resolving anthropogenic aerosol pollution types –
deconvolution and exploratory classification of pollution events, Atmos.
Chem. Phys., 17, 3165–3197, <a href="https://doi.org/10.5194/acp-17-3165-2017" target="_blank">https://doi.org/10.5194/acp-17-3165-2017</a>, 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>2</label><mixed-citation>
Äijälä, M., Daellenbach, K. R., Canonaco, F., Heikkinen, L.,
Junninen, H., Petäjä, T., Kulmala, M., Prévôt, A. S. H., and
Ehn, M.: Aerosol chemical composition results for SMEAR II 2008–2011 from
r-CMB model results, available at:
<a href="https://etsin.avointiede.fi/dataset/urn-nbn-fi-csc-kata20190319160233052956" target="_blank">https://etsin.avointiede.fi/dataset/urn-nbn-fi-csc-kata20190319160233052956</a>,
last access: 19 March 2019.
</mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>3</label><mixed-citation>
Aiken, A. C., DeCarlo, P. F., and Jimenez, J. L.: Elemental analysis of
organic species with electron ionization high-resolution mass spectrometry,
Anal. Chem., 79, 8350–8358, <a href="https://doi.org/10.1021/ac071150w" target="_blank">https://doi.org/10.1021/ac071150w</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>4</label><mixed-citation>
Aiken, A. C., Decarlo, P. F., Kroll, J. H., Worsnop, D. R., Huffman, J. A.,
Docherty, K. S., Ulbrich, I. M., Mohr, C., Kimmel, J. R., Sueper, D., Sun,
Y., Zhang, Q., Trimborn, A., Northway, M., Ziemann, P. J., Canagaratna, M.
R., Onasch, T. B., Alfarra, M. R., Prevot, A. S., Dommen, J., Duplissy, J.,
Metzger, A., Baltensperger, U., and Jimenez, J. L.: O&thinsp;∕&thinsp;C and OM&thinsp;∕&thinsp;OC
ratios of primary, secondary, and ambient organic aerosols with
high-resolution time-of-flight aerosol mass spectrometry, Environ. Sci.
Technol., 42, 4478–4485, 2008.
</mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>5</label><mixed-citation>
Alfarra, M. R., Coe, H., Allan, J. D., Bower, K. N., Boudries, H.,
Canagaratna, M. R., Jimenez, J. L., Jayne, J. T., Garforth, A. A., Li, S. M.,
and Worsnop, D. R.: Characterization of urban and rural organic particulate
in the lower Fraser valley using two aerodyne aerosol mass spectrometers,
Atmos. Environ., 38, 5745–5758, <a href="https://doi.org/10.1016/j.atmosenv.2004.01.054" target="_blank">https://doi.org/10.1016/j.atmosenv.2004.01.054</a>, 2004.
</mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>6</label><mixed-citation>
Alfarra, M. R., Prevot, A. S., Szidat, S., Sandradewi, J., Weimer, S., Lanz,
V. A., Schreiber, D., Mohr, M., and Baltensperger, U.: Identification of the
mass spectral signature of organic aerosols from wood burning emissions,
Environ. Sci. Technol., 41, 5770–5777, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>7</label><mixed-citation>
Allan, J. D., Alfarra, M. R., Bower, K. N., Williams, P. I., Gallagher, M.
W., Jimenez, J. L., McDonald, A. G., Nemitz, E., Canagaratna, M. R., and
Jayne, J. T.: Quantitative sampling using an Aerodyne aerosol mass
spectrometer 2. Measurements of fine particulate chemical composition in two
UK cities, J. Geophys. Res.-Atmos., 108, 4091, <a href="https://doi.org/10.1029/2002JD002359" target="_blank">https://doi.org/10.1029/2002JD002359</a>,
2003a.
</mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>8</label><mixed-citation>
Allan, J. D., Jimenez, J. L., Williams, P. I., Alfarra, M. R., Bower, K. N.,
Jayne, J. T., Coe, H., and Worsnop, D. R.: Quantitative sampling using an
Aerodyne aerosol mass spectrometer 1. Techniques of data interpretation and
error analysis, J. Geophys. Res.-Atmos., 108, 4090,
<a href="https://doi.org/10.1029/2002JD002358" target="_blank">https://doi.org/10.1029/2002JD002358</a>, 2003b.
</mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>9</label><mixed-citation>
Allan, J. D., Delia, A. E., Coe, H., Bower, K. N., Alfarra, M. R., Jimenez,
J. L., Middlebrook, A. M., Drewnick, F., Onasch, T. B., and Canagaratna, M.
R.: A generalised method for the extraction of chemically resolved mass
spectra from Aerodyne aerosol mass spectrometer data, J. Aerosol Sci., 35,
909–922, 2004.
</mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>10</label><mixed-citation>
Allan, J. D., Alfarra, M. R., Bower, K. N., Coe, H., Jayne, J. T., Worsnop,
D. R., Aalto, P. P., Kulmala, M., Hyötyläinen, T., Cavalli, F., and
Laaksonen, A.: Size and composition measurements of background aerosol and
new particle growth in a Finnish forest during QUEST 2 using an Aerodyne
Aerosol Mass Spectrometer, Atmos. Chem. Phys., 6, 315–327,
<a href="https://doi.org/10.5194/acp-6-315-2006" target="_blank">https://doi.org/10.5194/acp-6-315-2006</a>, 2006.
</mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>11</label><mixed-citation>
Arthur, D. and Vassilvitskii, S.: <i>k</i>-means+ + : The advantages of careful
seeding, Proceedings of the eighteenth annual ACM-SIAM symposium on Discrete
algorithms, New Orleans, Louisiana, USA, 7–9 January 2007, 1027–1035, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>12</label><mixed-citation>
Bahreini, R., Keywood, M. D., Ng, N. L., Varutbangkul, V., Gao, S., Flagan,
R. C., Seinfeld, J. H., Worsnop, D. R., and Jimenez, J. L.: Measurements of
secondary organic aerosol from oxidation of cycloalkenes, terpenes, and
m-xylene using an Aerodyne aerosol mass spectrometer, Environ. Sci. Technol.,
39, 5674–5688, <a href="https://doi.org/10.1021/es048061a" target="_blank">https://doi.org/10.1021/es048061a</a>, 2005.
</mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>13</label><mixed-citation>
Ball, G. H. and Hall, D. J.: ISODATA, a novel method of data analysis and
pattern classification, DTIC Document, Technical report, Stanford research
institute, Menlo Park, CA, USA, 1965.
</mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>14</label><mixed-citation>
Berkemeier, T., Ammann, M., Mentel, T. F., Pöschl, U., and Shiraiwa, M.:
Organic nitrate contribution to new particle formation and growth in
secondary organic aerosols from <i>α</i>-pinene ozonolysis, Environ. Sci.
Technol., 50, 6334–6342, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>15</label><mixed-citation>
Bilde, M., Barsanti, K., Booth, M., Cappa, C. D., Donahue, N. M.,
Emanuelsson, E. U., McFiggans, G., Krieger, U. K., Marcolli, C., and Topping,
D.: Saturation vapor pressures and transition enthalpies of low-volatility
organic molecules of atmospheric relevance: from dicarboxylic acids to
complex mixtures, Chem. Rev., 115, 4115–4156, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>16</label><mixed-citation>
Brown, S. G., Eberly, S., Paatero, P., and Norris, G. A.: Methods for
estimating uncertainty in PMF solutions: Examples with ambient air and water
quality data and guidance on reporting PMF results, Sci. Total Environ., 518,
626–635, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>17</label><mixed-citation>
Burns, J. A. and Whitesides, G. M.: Feed-forward neural networks in
chemistry: mathematical systems for classification and pattern recognition,
Chem. Rev., 93, 2583–2601, 1993.
</mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>18</label><mixed-citation>
Canagaratna, M. R., Jayne, J. T., Ghertner, D. A., Herndon, S., Shi, Q.,
Jimenez, J. L., Silva, P. J., Williams, P., Lanni, T., Drewnick, F.,
Demerjian, K. L., Kolb, C. E., and Worsnop, D. R.: Chase studies of
particulate emissions from in-use New York City vehicles, Aerosol Sci. Tech.,
38, 555–573, <a href="https://doi.org/10.1080/02786820490465504" target="_blank">https://doi.org/10.1080/02786820490465504</a>, 2004.
</mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>19</label><mixed-citation>
Canagaratna, M. R., Jayne, J. T., Jimenez, J. L., Allan, J. D., Alfarra, M.
R., Zhang, Q., Onasch, T. B., Drewnick, F., Coe, H., Middlebrook, A., Delia,
A., Williams, L. R., Trimborn, A. M., Northway, M. J., DeCarlo, P. F., Kolb,
C. E., Davidovits, P., and Worsnop, D. R.: Chemical and microphysical
characterization of ambient aerosols with the aerodyne aerosol mass
spectrometer, Mass Spectrom. Rev., 26, 185–222, <a href="https://doi.org/10.1002/mas.20115" target="_blank">https://doi.org/10.1002/mas.20115</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>20</label><mixed-citation>
Canonaco, F., Crippa, M., Slowik, J. G., Baltensperger, U., and
Prévôt, A. S. H.: SoFi, an IGOR-based interface for the efficient use
of the generalized multilinear engine (ME-2) for the source apportionment:
ME-2 application to aerosol mass spectrometer data, Atmos. Meas. Tech., 6,
3649–3661, <a href="https://doi.org/10.5194/amt-6-3649-2013" target="_blank">https://doi.org/10.5194/amt-6-3649-2013</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>21</label><mixed-citation>
Canonaco, F., Slowik, J. G., Baltensperger, U., and Prévôt, A. S. H.:
Seasonal differences in oxygenated organic aerosol composition: implications
for emissions sources and factor analysis, Atmos. Chem. Phys., 15,
6993–7002, <a href="https://doi.org/10.5194/acp-15-6993-2015" target="_blank">https://doi.org/10.5194/acp-15-6993-2015</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>22</label><mixed-citation>
Chirico, R., DeCarlo, P. F., Heringa, M. F., Tritscher, T., Richter, R.,
Prévôt, A. S. H., Dommen, J., Weingartner, E., Wehrle, G., Gysel, M.,
Laborde, M., and Baltensperger, U.: Impact of aftertreatment devices on
primary emissions and secondary organic aerosol formation potential from
in-use diesel vehicles: results from smog chamber experiments, Atmos. Chem.
Phys., 10, 11545–11563, <a href="https://doi.org/10.5194/acp-10-11545-2010" target="_blank">https://doi.org/10.5194/acp-10-11545-2010</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>23</label><mixed-citation>
Corrigan, A. L., Russell, L. M., Takahama, S., Äijälä, M., Ehn,
M., Junninen, H., Rinne, J., Petäjä, T., Kulmala, M., Vogel, A. L.,
Hoffmann, T., Ebben, C. J., Geiger, F. M., Chhabra, P., Seinfeld, J. H.,
Worsnop, D. R., Song, W., Auld, J., and Williams, J.: Biogenic and biomass
burning organic aerosol in a boreal forest at Hyytiälä, Finland,
during HUMPPA-COPEC 2010, Atmos. Chem. Phys., 13, 12233–12256,
<a href="https://doi.org/10.5194/acp-13-12233-2013" target="_blank">https://doi.org/10.5194/acp-13-12233-2013</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>24</label><mixed-citation>
Crippa, M., DeCarlo, P. F., Slowik, J. G., Mohr, C., Heringa, M. F., Chirico,
R., Poulain, L., Freutel, F., Sciare, J., Cozic, J., Di Marco, C. F.,
Elsasser, M., Nicolas, J. B., Marchand, N., Abidi, E., Wiedensohler, A.,
Drewnick, F., Schneider, J., Borrmann, S., Nemitz, E., Zimmermann, R.,
Jaffrezo, J.-L., Prévôt, A. S. H., and Baltensperger, U.: Wintertime
aerosol chemical composition and source apportionment of the organic fraction
in the metropolitan area of Paris, Atmos. Chem. Phys., 13, 961–981,
<a href="https://doi.org/10.5194/acp-13-961-2013" target="_blank">https://doi.org/10.5194/acp-13-961-2013</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>25</label><mixed-citation>
Crippa, M., Canonaco, F., Lanz, V. A., Äijälä, M., Allan, J. D.,
Carbone, S., Capes, G., Ceburnis, D., Dall'Osto, M., Day, D. A., DeCarlo, P.
F., Ehn, M., Eriksson, A., Freney, E., Hildebrandt Ruiz, L., Hillamo, R.,
Jimenez, J. L., Junninen, H., Kiendler-Scharr, A., Kortelainen, A.-M.,
Kulmala, M., Laaksonen, A., Mensah, A. A., Mohr, C., Nemitz, E., O'Dowd, C.,
Ovadnevaite, J., Pandis, S. N., Petäjä, T., Poulain, L., Saarikoski,
S., Sellegri, K., Swietlicki, E., Tiitta, P., Worsnop, D. R., Baltensperger,
U., and Prévôt, A. S. H.: Organic aerosol components derived from 25
AMS data sets across Europe using a consistent ME-2 based source
apportionment approach, Atmos. Chem. Phys., 14, 6159–6176,
<a href="https://doi.org/10.5194/acp-14-6159-2014" target="_blank">https://doi.org/10.5194/acp-14-6159-2014</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>26</label><mixed-citation>
Cubison, M. J., Ortega, A. M., Hayes, P. L., Farmer, D. K., Day, D., Lechner,
M. J., Brune, W. H., Apel, E., Diskin, G. S., Fisher, J. A., Fuelberg, H. E.,
Hecobian, A., Knapp, D. J., Mikoviny, T., Riemer, D., Sachse, G. W.,
Sessions, W., Weber, R. J., Weinheimer, A. J., Wisthaler, A., and Jimenez, J.
L.: Effects of aging on organic aerosol from open biomass burning smoke in
aircraft and laboratory studies, Atmos. Chem. Phys., 11, 12049–12064,
<a href="https://doi.org/10.5194/acp-11-12049-2011" target="_blank">https://doi.org/10.5194/acp-11-12049-2011</a>, 2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>27</label><mixed-citation>
Daellenbach, K. R., Stefenelli, G., Bozzetti, C., Vlachou, A., Fermo, P.,
Gonzalez, R., Piazzalunga, A., Colombi, C., Canonaco, F., Hueglin, C.,
Kasper-Giebl, A., Jaffrezo, J.-L., Bianchi, F., Slowik, J. G., Baltensperger,
U., El-Haddad, I., and Prévôt, A. S. H.: Long-term chemical analysis
and organic aerosol source apportionment at nine sites in central Europe:
source identification and uncertainty assessment, Atmos. Chem. Phys., 17,
13265–13282, <a href="https://doi.org/10.5194/acp-17-13265-2017" target="_blank">https://doi.org/10.5194/acp-17-13265-2017</a>, 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>28</label><mixed-citation>
Drewnick, F., Hings, S. S., DeCarlo, P., Jayne, J. T., Gonin, M., Fuhrer, K.,
Weimer, S., Jimenez, J. L., Demerjian, K. L., Borrmann, S., and Worsnop, D.
R.: A new time-of-flight aerosol mass spectrometer (TOF-AMS) – Instrument
description and first field deployment, Aerosol Sci. Tech., 39, 637–658,
<a href="https://doi.org/10.1080/02786820500182040" target="_blank">https://doi.org/10.1080/02786820500182040</a>, 2005.
</mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>29</label><mixed-citation>
Drewnick, F., Diesch, J.-M., Faber, P., and Borrmann, S.: Aerosol mass
spectrometry: particle–vaporizer interactions and their consequences for the
measurements, Atmos. Meas. Tech., 8, 3811–3830,
<a href="https://doi.org/10.5194/amt-8-3811-2015" target="_blank">https://doi.org/10.5194/amt-8-3811-2015</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>30</label><mixed-citation>
Duplissy, J., DeCarlo, P. F., Dommen, J., Alfarra, M. R., Metzger, A.,
Barmpadimos, I., Prevot, A. S. H., Weingartner, E., Tritscher, T., Gysel, M.,
Aiken, A. C., Jimenez, J. L., Canagaratna, M. R., Worsnop, D. R., Collins, D.
R., Tomlinson, J., and Baltensperger, U.: Relating hygroscopicity and
composition of organic aerosol particulate matter, Atmos. Chem. Phys., 11,
1155–1165, <a href="https://doi.org/10.5194/acp-11-1155-2011" target="_blank">https://doi.org/10.5194/acp-11-1155-2011</a>, 2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>31</label><mixed-citation>
Elsasser, M., Crippa, M., Orasche, J., DeCarlo, P. F., Oster, M., Pitz, M.,
Cyrys, J., Gustafson, T. L., Pettersson, J. B. C., Schnelle-Kreis, J.,
Prévôt, A. S. H., and Zimmermann, R.: Organic molecular markers and
signature from wood combustion particles in winter ambient aerosols: aerosol
mass spectrometer (AMS) and high time-resolved GC-MS measurements in
Augsburg, Germany, Atmos. Chem. Phys., 12, 6113–6128,
<a href="https://doi.org/10.5194/acp-12-6113-2012" target="_blank">https://doi.org/10.5194/acp-12-6113-2012</a>, 2012.
</mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>32</label><mixed-citation>
Farmer, D. K., Matsunaga, A., Docherty, K. S., Surratt, J. D., Seinfeld, J.
H., Ziemann, P. J., and Jimenez, J. L.: Response of an aerosol mass
spectrometer to organonitrates and organosulfates and implications for
atmospheric chemistry, P. Natl. Acad. Sci. USA, 107, 6670–6675,
<a href="https://doi.org/10.1073/pnas.0912340107" target="_blank">https://doi.org/10.1073/pnas.0912340107</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>33</label><mixed-citation>
Fortier, J. and Solomon, H.: Clustering procedures, in: Multivariate
Analysis, edited by: Krishnaiah, P. R., 493–506, Academic Press, New York,
USA, 1966.
</mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>34</label><mixed-citation>
Fountoukis, C. and Nenes, A.: ISORROPIA II: a computationally efficient
thermodynamic equilibrium model for
K<sup>+</sup>–Ca<sup>2+</sup>–Mg<sup>2+</sup>–NH<sub>4</sub><sup>+</sup>–Na<sup>+</sup>–SO<sub>4</sub><sup>2−</sup>–NO<sub>3</sub><sup>−</sup>–Cl<sup>−</sup>–H<sub>2</sub>O
aerosols, Atmos. Chem. Phys., 7, 4639–4659,
<a href="https://doi.org/10.5194/acp-7-4639-2007" target="_blank">https://doi.org/10.5194/acp-7-4639-2007</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>35</label><mixed-citation>
Freutel, F., Drewnick, F., Schneider, J., Klimach, T., and Borrmann, S.:
Quantitative single-particle analysis with the Aerodyne aerosol mass
spectrometer: development of a new classification algorithm and its
application to field data, Atmos. Meas. Tech., 6, 3131–3145,
<a href="https://doi.org/10.5194/amt-6-3131-2013" target="_blank">https://doi.org/10.5194/amt-6-3131-2013</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>36</label><mixed-citation>
Friedlander, S. K.: Chemical element balances and identification of air
pollution sources, Environ. Sci. Technol., 7, 235–240, 1973.
</mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>37</label><mixed-citation>
Gasteiger, J. and Zupan, J.: Neural networks in chemistry, Angew. Chem. Int.
Edit., 32, 503–527, 1993.
</mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>38</label><mixed-citation>
Gordon, G. E.: Receptor models, Environ. Sci. Technol., 22, 1132–1142, 1988.
</mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>39</label><mixed-citation>
Gysel, M., Crosier, J., Topping, D. O., Whitehead, J. D., Bower, K. N.,
Cubison, M. J., Williams, P. I., Flynn, M. J., McFiggans, G. B., and Coe, H.:
Closure study between chemical composition and hygroscopic growth of aerosol
particles during TORCH2, Atmos. Chem. Phys., 7, 6131–6144,
<a href="https://doi.org/10.5194/acp-7-6131-2007" target="_blank">https://doi.org/10.5194/acp-7-6131-2007</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>40</label><mixed-citation>
Hao, L. Q., Kortelainen, A., Romakkaniemi, S., Portin, H., Jaatinen, A.,
Leskinen, A., Komppula, M., Miettinen, P., Sueper, D., Pajunoja, A., Smith,
J. N., Lehtinen, K. E. J., Worsnop, D. R., Laaksonen, A., and Virtanen, A.:
Atmospheric submicron aerosol composition and particulate organic nitrate
formation in a boreal forestland–urban mixed region, Atmos. Chem. Phys., 14,
13483–13495, <a href="https://doi.org/10.5194/acp-14-13483-2014" target="_blank">https://doi.org/10.5194/acp-14-13483-2014</a>, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>41</label><mixed-citation>
Hari, P. and Kulmala, M.: Station for measuring ecosystem-atmosphere
relations (SMEAR II), Boreal Environ. Res., 10, 315–322, 2005.
</mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>42</label><mixed-citation>
Haynes, W. M.: CRC handbook of chemistry and physics, CRC press, Boca Raton,
FL, USA, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>43</label><mixed-citation>
Hersey, S. P., Craven, J. S., Schilling, K. A., Metcalf, A. R., Sorooshian,
A., Chan, M. N., Flagan, R. C., and Seinfeld, J. H.: The Pasadena Aerosol
Characterization Observatory (PACO): chemical and physical analysis of the
Western Los Angeles basin aerosol, Atmos. Chem. Phys., 11, 7417–7443,
<a href="https://doi.org/10.5194/acp-11-7417-2011" target="_blank">https://doi.org/10.5194/acp-11-7417-2011</a>, 2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>44</label><mixed-citation>
Hoffmann, D., Tilgner, A., Iinuma, Y., and Herrmann, H.: Atmospheric
stability of levoglucosan: a detailed laboratory and modeling study, Environ.
Sci. Technol., 44, 694–699, 2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>45</label><mixed-citation>
Hong, J., Äijälä, M., Häme, S. A. K., Hao, L., Duplissy, J.,
Heikkinen, L. M., Nie, W., Mikkilä, J., Kulmala, M., Prisle, N. L.,
Virtanen, A., Ehn, M., Paasonen, P., Worsnop, D. R., Riipinen, I.,
Petäjä, T., and Kerminen, V.-M.: Estimates of the organic aerosol
volatility in a boreal forest using two independent methods, Atmos. Chem.
Phys., 17, 4387–4399, <a href="https://doi.org/10.5194/acp-17-4387-2017" target="_blank">https://doi.org/10.5194/acp-17-4387-2017</a>, 2017.
</mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>46</label><mixed-citation>
Hopke, P. K.: Receptor modeling for air quality management, Elsevier,
Amsterdam, the Netherlands, 1991.
</mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>47</label><mixed-citation>
Hopke, P. K.: Review of receptor modeling methods for source apportionment,
J. Air Waste Manage., 66, 237–259, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>48</label><mixed-citation>
Horai, H., Arita, M., Kanaya, S., Nihei, Y., Ikeda, T., Suwa, K., Ojima, Y.,
Tanaka, K., Tanaka, S., Aoshima, K., Oda, Y., Kakazu, Y., Kusano, M., Tohge,
T., Matsuda, F., Sawada, Y., Hirai, M. Y., Nakanishi, H., Ikeda, K., Akimoto,
N., Maoka, T., Takahashi, H., Ara, T., Sakurai, N., Suzuki, H., Shibata, D.,
Neumann, S., Iida, T., Tanaka, K., Funatsu, K., Matsuura, F., Soga, T.,
Taguchi, R., Saito, K., and Nishioka, T.: MassBank: a public repository for
sharing mass spectral data for life sciences, J. Mass Spectrom., 45,
703–714, <a href="https://doi.org/10.1002/jms.1777" target="_blank">https://doi.org/10.1002/jms.1777</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>49</label><mixed-citation>
Irei, S., Shimono, A., Hikida, T., Kuramoto, K., Suzuki, Y., and Takami, A.:
Qualitative evaluation of <i>m</i>∕<i>z</i> 85, 87, and 133 signals in organic aerosol
mass spectra of fly ash produced by coal combustion, Aerosol Air Qual. Res.,
14, 406–412, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>50</label><mixed-citation>
Jain, A. K.: Data clustering: 50 years beyond K-means, Pattern Recogn. Lett.,
31, 651–666, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>51</label><mixed-citation>
Jimenez, J. L., Canagaratna, M. R., Donahue, N. M., Prevot, A. S., Zhang, Q.,
Kroll, J. H., DeCarlo, P. F., Allan, J. D., Coe, H., Ng, N. L., Aiken, A. C.,
Docherty, K. S., Ulbrich, I. M., Grieshop, A. P., Robinson, A. L., Duplissy,
J., Smith, J. D., Wilson, K. R., Lanz, V. A., Hueglin, C., Sun, Y. L., Tian,
J., Laaksonen, A., Raatikainen, T., Rautiainen, J., Vaattovaara, P., Ehn, M.,
Kulmala, M., Tomlinson, J. M., Collins, D. R., Cubison, M. J., Dunlea, E. J.,
Huffman, J. A., Onasch, T. B., Alfarra, M. R., Williams, P. I., Bower, K.,
Kondo, Y., Schneider, J., Drewnick, F., Borrmann, S., Weimer, S., Demerjian,
K., Salcedo, D., Cottrell, L., Griffin, R., Takami, A., Miyoshi, T.,
Hatakeyama, S., Shimono, A., Sun, J. Y., Zhang, Y. M., Dzepina, K., Kimmel,
J. R., Sueper, D., Jayne, J. T., Herndon, S. C., Trimborn, A. M., Williams,
L. R., Wood, E. C., Middlebrook, A. M., Kolb, C. E., Baltensperger, U., and
Worsnop, D. R.: Evolution of organic aerosols in the atmosphere, Science,
326, 1525–1529, <a href="https://doi.org/10.1126/science.1180353" target="_blank">https://doi.org/10.1126/science.1180353</a>, 2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>52</label><mixed-citation>
Kiendler-Scharr, A., Mensah, A. A., Friese, E., Topping, D., Nemitz, E.,
Prevot, A., Äijälä, M., Allan, J., Canonaco, F., and Canagaratna,
M.: Ubiquity of organic nitrates from nighttime chemistry in the European
submicron aerosol, Geophys. Res. Lett., 43, 7735–7744, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>53</label><mixed-citation>
Kim, S., Koo, I., Wei, X., and Zhang, X.: A method of finding optimal weight
factors for compound identification in gas chromatography-mass spectrometry,
Bioinformatics, 28, 1158–1163, <a href="https://doi.org/10.1093/bioinformatics/bts083" target="_blank">https://doi.org/10.1093/bioinformatics/bts083</a>, 2012.
</mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>54</label><mixed-citation>
Kowalski, B. R.: Measurement analysis by pattern recognition, Anal. Chem.,
47, 1152A–1162a, 1975.
</mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>55</label><mixed-citation>
Kroll, J. H. and Seinfeld, J. H.: Chemistry of secondary organic aerosol:
Formation and evolution of low-volatility organics in the atmosphere, Atmos.
Environ., 42, 3593–3624, 2008.
</mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>56</label><mixed-citation>
Kulmala, M., Rannik, Ü., Pirjola, L., Dal Maso, M., Karimäki, J.,
Asmi, A., Jäppinen, A., Karhu, V., Korhonen, H., and Malvikko, S.-P.:
Characterization of atmospheric trace gas and aerosol concentrations at
forest sites in southern and northern Finland using back trajectories, Boreal
Environ. Res., 5, 315–336, 2000.
</mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>57</label><mixed-citation>
Kulmala, M., Asmi, A., Lappalainen, H. K., Carslaw, K. S., Pöschl, U.,
Baltensperger, U., Hov, Ø., Brenquier, J.-L., Pandis, S. N., Facchini, M.
C., Hansson, H.-C., Wiedensohler, A., and O'Dowd, C. D.: Introduction:
European Integrated Project on Aerosol Cloud Climate and Air Quality
interactions (EUCAARI) – integrating aerosol research from nano to global
scales, Atmos. Chem. Phys., 9, 2825–2841,
<a href="https://doi.org/10.5194/acp-9-2825-2009" target="_blank">https://doi.org/10.5194/acp-9-2825-2009</a>, 2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>58</label><mixed-citation>
Kulmala, M., Asmi, A., Lappalainen, H. K., Baltensperger, U., Brenguier,
J.-L., Facchini, M. C., Hansson, H.-C., Hov, Ø., O'Dowd, C. D.,
Pöschl, U., Wiedensohler, A., Boers, R., Boucher, O., de Leeuw, G.,
Denier van der Gon, H. A. C., Feichter, J., Krejci, R., Laj, P., Lihavainen,
H., Lohmann, U., McFiggans, G., Mentel, T., Pilinis, C., Riipinen, I.,
Schulz, M., Stohl, A., Swietlicki, E., Vignati, E., Alves, C., Amann, M.,
Ammann, M., Arabas, S., Artaxo, P., Baars, H., Beddows, D. C. S.,
Bergström, R., Beukes, J. P., Bilde, M., Burkhart, J. F., Canonaco, F.,
Clegg, S. L., Coe, H., Crumeyrolle, S., D'Anna, B., Decesari, S., Gilardoni,
S., Fischer, M., Fjaeraa, A. M., Fountoukis, C., George, C., Gomes, L.,
Halloran, P., Hamburger, T., Harrison, R. M., Herrmann, H., Hoffmann, T.,
Hoose, C., Hu, M., Hyvärinen, A., Hõrrak, U., Iinuma, Y., Iversen,
T., Josipovic, M., Kanakidou, M., Kiendler-Scharr, A., Kirkevåg, A.,
Kiss, G., Klimont, Z., Kolmonen, P., Komppula, M., Kristjánsson, J.-E.,
Laakso, L., Laaksonen, A., Labonnote, L., Lanz, V. A., Lehtinen, K. E. J.,
Rizzo, L. V., Makkonen, R., Manninen, H. E., McMeeking, G., Merikanto, J.,
Minikin, A., Mirme, S., Morgan, W. T., Nemitz, E., O'Donnell, D., Panwar, T.
S., Pawlowska, H., Petzold, A., Pienaar, J. J., Pio, C., Plass-Duelmer, C.,
Prévôt, A. S. H., Pryor, S., Reddington, C. L., Roberts, G.,
Rosenfeld, D., Schwarz, J., Seland, Ø., Sellegri, K., Shen, X. J.,
Shiraiwa, M., Siebert, H., Sierau, B., Simpson, D., Sun, J. Y., Topping, D.,
Tunved, P., Vaattovaara, P., Vakkari, V., Veefkind, J. P., Visschedijk, A.,
Vuollekoski, H., Vuolo, R., Wehner, B., Wildt, J., Woodward, S., Worsnop, D.
R., van Zadelhoff, G.-J., Zardini, A. A., Zhang, K., van Zyl, P. G.,
Kerminen, V.-M., S Carslaw, K., and Pandis, S. N.: General overview: European
Integrated project on Aerosol Cloud Climate and Air Quality interactions
(EUCAARI) – integrating aerosol research from nano to global scales, Atmos.
Chem. Phys., 11, 13061–13143, <a href="https://doi.org/10.5194/acp-11-13061-2011" target="_blank">https://doi.org/10.5194/acp-11-13061-2011</a>,
2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>59</label><mixed-citation>
Lanz, V. A., Alfarra, M. R., Baltensperger, U., Buchmann, B., Hueglin, C.,
and Prévôt, A. S. H.: Source apportionment of submicron organic
aerosols at an urban site by factor analytical modelling of aerosol mass
spectra, Atmos. Chem. Phys., 7, 1503–1522,
<a href="https://doi.org/10.5194/acp-7-1503-2007" target="_blank">https://doi.org/10.5194/acp-7-1503-2007</a>, 2007a.
</mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>60</label><mixed-citation>
Lanz, V. A., Alfarra, M. R., Baltensperger, U., Buchmann, B., Hueglin, C.,
Szidat, S., Wehrli, M. N., Wacker, L., Weimer, S., and Caseiro, A.: Source
attribution of submicron organic aerosols during wintertime inversions by
advanced factor analysis of aerosol mass spectra, Environ. Sci. Technol., 42,
214–220, 2007b.
</mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>61</label><mixed-citation>
Lee, B. H., Mohr, C., Lopez-Hilfiker, F. D., Lutz, A., Hallquist, M., Lee,
L., Romer, P., Cohen, R. C., Iyer, S., and Kurtén, T.: Highly
functionalized organic nitrates in the southeast United States: Contribution
to secondary organic aerosol and reactive nitrogen budgets, P. Natl. Acad.
Sci. USA, 113, 1516–1521, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>62</label><mixed-citation>
Li, J., Pósfai, M., Hobbs, P. V., and Buseck, P. R.: Individual aerosol
particles from biomass burning in southern Africa: 2. Compositions and aging
of inorganic particles, J. Geophys. Res.-Atmos., 108, 8484,
<a href="https://doi.org/10.1029/2002JD002310" target="_blank">https://doi.org/10.1029/2002JD002310</a>, 2003.
</mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>63</label><mixed-citation>
Liang, Z., Chen, L., Alam, M. S., Rezaei, S. Z., Stark, C., Xu, H., and
Harrison, R. M.: Comprehensive chemical characterization of lubricating oils
used in modern vehicular engines utilizing GC × GC-TOFMS, Fuel, 220,
792–799, 2018.
</mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>64</label><mixed-citation>
Lindon, J. C., Tranter, G. E., and Koppenaal, D.: Encyclopedia of
spectroscopy and spectrometry, Academic Press, San Diego, USA, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib65"><label>65</label><mixed-citation>
Liu, P. S., Deng, R., Smith, K. A., Williams, L. R., Jayne, J. T.,
Canagaratna, M. R., Moore, K., Onasch, T. B., Worsnop, D. R., and Deshler,
T.: Transmission efficiency of an aerodynamic focusing lens system:
Comparison of model calculations and laboratory measurements for the Aerodyne
Aerosol Mass Spectrometer, Aerosol Sci. Tech., 41, 721–733, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib66"><label>66</label><mixed-citation>
MacQueen, J.: Some methods for classification and analysis of multivariate
observations, Proceedings of the fifth Berkeley symposium on mathematical
statistics and probability, 21 June–18 July 1965 and 27 December
1965–7 January 1966, Statistical Laboratory of the University of California,
Berkeley, USA, 281–297, 1967.
</mixed-citation></ref-html>
<ref-html id="bib1.bib67"><label>67</label><mixed-citation>
Mclafferty, F. W.: Mass Spectrometric Analysis – Molecular Rearrangements,
Anal. Chem., 31, 82–87, <a href="https://doi.org/10.1021/ac60145a015" target="_blank">https://doi.org/10.1021/ac60145a015</a>, 1959.
</mixed-citation></ref-html>
<ref-html id="bib1.bib68"><label>68</label><mixed-citation>
McLafferty, F. W. and Turecek, F.: Interpretation of mass spectra, University
science books, Mill Valley, CA, USA, 1993.
</mixed-citation></ref-html>
<ref-html id="bib1.bib69"><label>69</label><mixed-citation>
Mcquitty, L. L.: Similarity Analysis by Reciprocal Pairs for Discrete and
Continuous Data, Educ. Psychol. Meas., 26, 825–831,
<a href="https://doi.org/10.1177/001316446602600402" target="_blank">https://doi.org/10.1177/001316446602600402</a>, 1966.
</mixed-citation></ref-html>
<ref-html id="bib1.bib70"><label>70</label><mixed-citation>
Miller, M., Friedlander, S., and Hidy, G.: A chemical element balance for the
Pasadena aerosol, in: Aerosols and atmospheric chemistry, Academic Press, New
York, USA, 301–312, 1972.
</mixed-citation></ref-html>
<ref-html id="bib1.bib71"><label>71</label><mixed-citation>
Mohr, C., Huffman, A., Cubison, M. J., Aiken, A. C., Docherty, K. S., Kimmel,
J. R., Ulbrich, I. M., Hannigan, M., and Jimenez, J. L.: Characterization of
primary organic aerosol emissions from meat cooking, trash burning, and motor
vehicles with high-resolution aerosol mass spectrometry and comparison with
ambient and chamber observations, Environ. Sci. Technol., 43, 2443–2449,
2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib72"><label>72</label><mixed-citation>
Mohr, C., DeCarlo, P. F., Heringa, M. F., Chirico, R., Slowik, J. G.,
Richter, R., Reche, C., Alastuey, A., Querol, X., Seco, R., Peñuelas, J.,
Jiménez, J. L., Crippa, M., Zimmermann, R., Baltensperger, U., and
Prévôt, A. S. H.: Identification and quantification of organic
aerosol from cooking and other sources in Barcelona using aerosol mass
spectrometer data, Atmos. Chem. Phys., 12, 1649–1665,
<a href="https://doi.org/10.5194/acp-12-1649-2012" target="_blank">https://doi.org/10.5194/acp-12-1649-2012</a>, 2012.
</mixed-citation></ref-html>
<ref-html id="bib1.bib73"><label>73</label><mixed-citation>
Murphy, S. M., Sorooshian, A., Kroll, J. H., Ng, N. L., Chhabra, P., Tong,
C., Surratt, J. D., Knipping, E., Flagan, R. C., and Seinfeld, J. H.:
Secondary aerosol formation from atmospheric reactions of aliphatic amines,
Atmos. Chem. Phys., 7, 2313–2337, <a href="https://doi.org/10.5194/acp-7-2313-2007" target="_blank">https://doi.org/10.5194/acp-7-2313-2007</a>,
2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib74"><label>74</label><mixed-citation>
Ng, N. L., Canagaratna, M. R., Zhang, Q., Jimenez, J. L., Tian, J., Ulbrich,
I. M., Kroll, J. H., Docherty, K. S., Chhabra, P. S., Bahreini, R., Murphy,
S. M., Seinfeld, J. H., Hildebrandt, L., Donahue, N. M., DeCarlo, P. F.,
Lanz, V. A., Prévôt, A. S. H., Dinar, E., Rudich, Y., and Worsnop, D.
R.: Organic aerosol components observed in Northern Hemispheric datasets from
Aerosol Mass Spectrometry, Atmos. Chem. Phys., 10, 4625–4641,
<a href="https://doi.org/10.5194/acp-10-4625-2010" target="_blank">https://doi.org/10.5194/acp-10-4625-2010</a>, 2010.
</mixed-citation></ref-html>
<ref-html id="bib1.bib75"><label>75</label><mixed-citation>
Ng, N. L., Canagaratna, M. R., Jimenez, J. L., Zhang, Q., Ulbrich, I. M., and
Worsnop, D. R.: Real-time methods for estimating organic component mass
concentrations from aerosol mass spectrometer data, Environ. Sci. Technol.,
45, 910–916, <a href="https://doi.org/10.1021/es102951k" target="_blank">https://doi.org/10.1021/es102951k</a>, 2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib76"><label>76</label><mixed-citation>
Niemi, J. V., Saarikoski, S., Aurela, M., Tervahattu, H., Hillamo, R.,
Westphal, D. L., Aarnio, P., Koskentalo, T., Makkonen, U., Vehkamaki, H., and
Kulmala, M.: Long-range transport episodes of fine particles in southern
Finland during 1999–2007, Atmos. Environ., 43, 1255–1264,
<a href="https://doi.org/10.1016/j.atmosenv.2008.11.022" target="_blank">https://doi.org/10.1016/j.atmosenv.2008.11.022</a>, 2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib77"><label>77</label><mixed-citation>
Orlando, J. J. and Tyndall, G. S.: Laboratory studies of organic peroxy
radical chemistry: an overview with emphasis on recent issues of atmospheric
significance, Chem. Soc. Rev., 41, 6294–6317, 2012.
</mixed-citation></ref-html>
<ref-html id="bib1.bib78"><label>78</label><mixed-citation>
Osborne, J. W., Costello, A. B., and Kellow, J. T.: Best practices in
exploratory factor analysis, CreateSpace Independent Publishing Platform,
Charleston, SC, USA, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib79"><label>79</label><mixed-citation>
Paatero, P.: Least squares formulation of robust non-negative factor
analysis, Chemometr. Intell. Lab., 37, 23–35,
<a href="https://doi.org/10.1016/S0169-7439(96)00044-5" target="_blank">https://doi.org/10.1016/S0169-7439(96)00044-5</a>, 1997.
</mixed-citation></ref-html>
<ref-html id="bib1.bib80"><label>80</label><mixed-citation>
Paatero, P.: The multilinear engine – A table-driven, least squares program
for solving multilinear problems, including the n-way parallel factor
analysis model, J. Comput. Graph. Stat., 8, 854–888, <a href="https://doi.org/10.2307/1390831" target="_blank">https://doi.org/10.2307/1390831</a>,
1999.
</mixed-citation></ref-html>
<ref-html id="bib1.bib81"><label>81</label><mixed-citation>
Paatero, P.: User's guide for positive matrix factorization programs PMF2 and
PMF3, University of Helsinki, Helsinki, Finland, 2000.
</mixed-citation></ref-html>
<ref-html id="bib1.bib82"><label>82</label><mixed-citation>
Paatero, P. and Tapper, U.: Positive matrix factorization: A non-negative
factor model with optimal utilization of error estimates of data values,
Environmetrics, 5, 111–126, 1994.
</mixed-citation></ref-html>
<ref-html id="bib1.bib83"><label>83</label><mixed-citation>
Patokoski, J., Ruuskanen, T. M., Kajos, M. K., Taipale, R., Rantala, P.,
Aalto, J., Ryyppö, T., Nieminen, T., Hakola, H., and Rinne, J.: Sources
of long-lived atmospheric VOCs at the rural boreal forest site, SMEAR II,
Atmos. Chem. Phys., 15, 13413–13432,
<a href="https://doi.org/10.5194/acp-15-13413-2015" target="_blank">https://doi.org/10.5194/acp-15-13413-2015</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib84"><label>84</label><mixed-citation>
Peräkylä, O., Vogt, M., Tikkanen, O.-P., Laurila, T., Kajos, M. K.,
Rantala, P. A., Patokoski, J., Aalto, J., Yli-Juuti, T., and Ehn, M.:
Monoterpenes' oxidation capacity and rate over a boreal forest (suppl. B),
Boreal Environ. Res., 19, 293–310, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib85"><label>85</label><mixed-citation>
Pieber, S. M., El Haddad, I., Slowik, J. G., Canagaratna, M. R., Jayne, J.
T., Platt, S. M., Bozzetti, C., Daellenbach, K. R., Fröhlich, R., and
Vlachou, A.: Inorganic salt interference on CO<sub>2</sub><sup>+</sup> in aerodyne AMS
and ACSM organic aerosol composition studies, Environ. Sci. Technol., 50,
10494–10503, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib86"><label>86</label><mixed-citation>
Rasulev, U. K. and Zandberg, E. Y.: Surface ionization of organic compounds
and its applications, Prog. Surf. Sci., 28, 181–412, 1988.
</mixed-citation></ref-html>
<ref-html id="bib1.bib87"><label>87</label><mixed-citation>
Rebotier, T. P. and Prather, K. A.: Aerosol time-of-flight mass spectrometry
data analysis: a benchmark of clustering algorithms, Anal. Chim. Acta, 585,
38–54, <a href="https://doi.org/10.1016/j.aca.2006.12.009" target="_blank">https://doi.org/10.1016/j.aca.2006.12.009</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib88"><label>88</label><mixed-citation>
Reilly, P. and Wood, R. H.: Prediction of the properties of mixed
electrolytes from measurements on common ion mixtures, J. Phys. Chem., 73,
4292–4297, 1969.
</mixed-citation></ref-html>
<ref-html id="bib1.bib89"><label>89</label><mixed-citation>
Robinson, N. H., Hamilton, J. F., Allan, J. D., Langford, B., Oram, D. E.,
Chen, Q., Docherty, K., Farmer, D. K., Jimenez, J. L., Ward, M. W., Hewitt,
C. N., Barley, M. H., Jenkin, M. E., Rickard, A. R., Martin, S. T.,
McFiggans, G., and Coe, H.: Evidence for a significant proportion of
Secondary Organic Aerosol from isoprene above a maritime tropical forest,
Atmos. Chem. Phys., 11, 1039–1050, <a href="https://doi.org/10.5194/acp-11-1039-2011" target="_blank">https://doi.org/10.5194/acp-11-1039-2011</a>,
2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib90"><label>90</label><mixed-citation>
Rousseeuw, P. J.: Silhouettes – a Graphical Aid to the Interpretation and
Validation of Cluster-Analysis, J. Comput. Appl. Math., 20, 53–65,
<a href="https://doi.org/10.1016/0377-0427(87)90125-7" target="_blank">https://doi.org/10.1016/0377-0427(87)90125-7</a>, 1987.
</mixed-citation></ref-html>
<ref-html id="bib1.bib91"><label>91</label><mixed-citation>
Schneider, J., Weimer, S., Drewnick, F., Borrmann, S., Helas, G., Gwaze, P.,
Schmid, O., Andreae, M. O., and Kirchner, U.: Mass spectrometric analysis and
aerodynamic properties of various types of combustion-related aerosol
particles, Int. J. Mass Spectrom., 258, 37–49,
<a href="https://doi.org/10.1016/j.ijms.2006.07.008" target="_blank">https://doi.org/10.1016/j.ijms.2006.07.008</a>, 2006.
</mixed-citation></ref-html>
<ref-html id="bib1.bib92"><label>92</label><mixed-citation>
Shafizadeh, F.: The chemistry of pyrolysis and combustion, The chemistry of
solid wood, in: Advances in Chemistry Series, edited by: Rowell, R. M.,
Number 207, North American Chemical Society, Washington, D.C., USA, 489–529,
1984.
</mixed-citation></ref-html>
<ref-html id="bib1.bib93"><label>93</label><mixed-citation>
Sofowote, U. M., Su, Y., Dabek-Zlotorzynska, E., Rastogi, A. K., Brook, J.,
and Hopke, P. K.: Constraining the factor analytical solutions obtained from
multiple-year receptor modeling of ambient PM<sub>2.5</sub> data from five
speciation sites in Ontario, Canada, Atmos. Environ., 108, 151–157, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib94"><label>94</label><mixed-citation>
Sogacheva, L., Dal Maso, M., Kerminen, V.-M., and Kulmala, M.: Probability of
nucleation events and aerosol particle concentration in different air mass
types arriving at Hyytiälä, southern Finland, based on back
trajectories analysis, Boreal Environ. Res., 10, 479–491, 2005.
</mixed-citation></ref-html>
<ref-html id="bib1.bib95"><label>95</label><mixed-citation>
Stein, S. E. and Scott, D. R.: Optimization and testing of mass spectral
library search algorithms for compound identification, J. Am. Soc. Mass
Spectrom., 5, 859–866, <a href="https://doi.org/10.1016/1044-0305(94)87009-8" target="_blank">https://doi.org/10.1016/1044-0305(94)87009-8</a>, 1994.
</mixed-citation></ref-html>
<ref-html id="bib1.bib96"><label>96</label><mixed-citation>
Steinhaus, H.: Sur la division des corp materiels en parties, Bull. Acad.
Polon. Sci., 1, 801–804, 1956.
</mixed-citation></ref-html>
<ref-html id="bib1.bib97"><label>97</label><mixed-citation>
Sun, Y. L., Zhang, Q., Schwab, J. J., Yang, T., Ng, N. L., and Demerjian, K.
L.: Factor analysis of combined organic and inorganic aerosol mass spectra
from high resolution aerosol mass spectrometer measurements, Atmos. Chem.
Phys., 12, 8537–8551, <a href="https://doi.org/10.5194/acp-12-8537-2012" target="_blank">https://doi.org/10.5194/acp-12-8537-2012</a>, 2012.
</mixed-citation></ref-html>
<ref-html id="bib1.bib98"><label>98</label><mixed-citation>
Swietlicki, E., Hansson, H.-C., Hämeri, K., Svenningsson, B., Massling,
A., McFiggans, G., McMurry, P., Petäjä, T., Tunved, P., and Gysel,
M.: Hygroscopic properties of submicrometer atmospheric aerosol particles
measured with H-TDMA instruments in various environments – a review, Tellus
B, 60, 432–469, 2008.
</mixed-citation></ref-html>
<ref-html id="bib1.bib99"><label>99</label><mixed-citation>
Takami, A., Miyoshi, T., Shimono, A., Kaneyasu, N., Kato, S., Kajii, Y., and
Hatakeyama, S.: Transport of anthropogenic aerosols from Asia and subsequent
chemical transformation, J. Geophys. Res.-Atmos., 112, D22S31,
<a href="https://doi.org/10.1029/2006JD008120" target="_blank">https://doi.org/10.1029/2006JD008120</a>, 2007.
</mixed-citation></ref-html>
<ref-html id="bib1.bib100"><label>100</label><mixed-citation>
Ulbrich, I. M., Canagaratna, M. R., Zhang, Q., Worsnop, D. R., and Jimenez,
J. L.: Interpretation of organic components from Positive Matrix
Factorization of aerosol mass spectrometric data, Atmos. Chem. Phys., 9,
2891–2918, <a href="https://doi.org/10.5194/acp-9-2891-2009" target="_blank">https://doi.org/10.5194/acp-9-2891-2009</a>, 2009.
</mixed-citation></ref-html>
<ref-html id="bib1.bib101"><label>101</label><mixed-citation>
Vogel, A. L., Äijälä, M., Corrigan, A. L., Junninen, H., Ehn, M.,
Petäjä, T., Worsnop, D. R., Kulmala, M., Russell, L. M., Williams,
J., and Hoffmann, T.: In situ submicron organic aerosol characterization at a
boreal forest research station during HUMPPA-COPEC 2010 using soft and hard
ionization mass spectrometry, Atmos. Chem. Phys., 13, 10933–10950,
<a href="https://doi.org/10.5194/acp-13-10933-2013" target="_blank">https://doi.org/10.5194/acp-13-10933-2013</a>, 2013.
</mixed-citation></ref-html>
<ref-html id="bib1.bib102"><label>102</label><mixed-citation>
Williams, J., Crowley, J., Fischer, H., Harder, H., Martinez, M.,
Petäjä, T., Rinne, J., Bäck, J., Boy, M., Dal Maso, M., Hakala,
J., Kajos, M., Keronen, P., Rantala, P., Aalto, J., Aaltonen, H., Paatero,
J., Vesala, T., Hakola, H., Levula, J., Pohja, T., Herrmann, F., Auld, J.,
Mesarchaki, E., Song, W., Yassaa, N., Nölscher, A., Johnson, A. M.,
Custer, T., Sinha, V., Thieser, J., Pouvesle, N., Taraborrelli, D., Tang, M.
J., Bozem, H., Hosaynali-Beygi, Z., Axinte, R., Oswald, R., Novelli, A.,
Kubistin, D., Hens, K., Javed, U., Trawny, K., Breitenberger, C., Hidalgo, P.
J., Ebben, C. J., Geiger, F. M., Corrigan, A. L., Russell, L. M., Ouwersloot,
H. G., Vilà-Guerau de Arellano, J., Ganzeveld, L., Vogel, A., Beck, M.,
Bayerle, A., Kampf, C. J., Bertelmann, M., Köllner, F., Hoffmann, T.,
Valverde, J., González, D., Riekkola, M.-L., Kulmala, M., and Lelieveld,
J.: The summertime Boreal forest field measurement intensive
(HUMPPA-COPEC-2010): an overview of meteorological and chemical influences,
Atmos. Chem. Phys., 11, 10599–10618,
<a href="https://doi.org/10.5194/acp-11-10599-2011" target="_blank">https://doi.org/10.5194/acp-11-10599-2011</a>, 2011.

</mixed-citation></ref-html>
<ref-html id="bib1.bib103"><label>103</label><mixed-citation>
Worton, D. R., Isaacman, G., Gentner, D. R., Dallmann, T. R., Chan, A. W.,
Ruehl, C., Kirchstetter, T. W., Wilson, K. R., Harley, R. A., and Goldstein,
A. H.: Lubricating oil dominates primary organic aerosol emissions from motor
vehicles, Environ. Sci. Technol., 48, 3698–3706, 2014.
</mixed-citation></ref-html>
<ref-html id="bib1.bib104"><label>104</label><mixed-citation>
Yatavelli, R. L., Mohr, C., Stark, H., Day, D. A., Thompson, S. L.,
Lopez-Hilfiker, F. D., Campuzano-Jost, P., Palm, B. B., Vogel, A. L., and
Hoffmann, T.: Estimating the contribution of organic acids to northern
hemispheric continental organic aerosol, Geophys. Res. Lett., 42, 6084–6090,
2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib105"><label>105</label><mixed-citation>
Ye, Q., Robinson, E. S., Ding, X., Ye, P., Sullivan, R. C., and Donahue, N.
M.: Mixing of secondary organic aerosols versus relative humidity, P. Natl.
Acad. Sci. USA, 113, 12649–12654, 2016.
</mixed-citation></ref-html>
<ref-html id="bib1.bib106"><label>106</label><mixed-citation>
Zhang, Q., Alfarra, M. R., Worsnop, D. R., Allan, J. D., Coe, H.,
Canagaratna, M. R., and Jimenez, J. L.: Deconvolution and quantification of
hydrocarbon-like and oxygenated organic aerosols based on aerosol mass
spectrometry, Environ. Sci. Technol., 39, 4938–4952, 2005.
</mixed-citation></ref-html>
<ref-html id="bib1.bib107"><label>107</label><mixed-citation>
Zhang, Q., Jimenez, J. L., Canagaratna, M. R., Ulbrich, I. M., Ng, N. L.,
Worsnop, D. R., and Sun, Y.: Understanding atmospheric organic aerosols via
factor analysis of aerosol mass spectrometry: a review, Anal. Bioanal. Chem.,
401, 3045–3067, <a href="https://doi.org/10.1007/s00216-011-5355-y" target="_blank">https://doi.org/10.1007/s00216-011-5355-y</a>, 2011.
</mixed-citation></ref-html>
<ref-html id="bib1.bib108"><label>108</label><mixed-citation>
Zieger, P., Aalto, P. P., Aaltonen, V., Äijälä, M., Backman, J.,
Hong, J., Komppula, M., Krejci, R., Laborde, M., Lampilahti, J., de Leeuw,
G., Pfüller, A., Rosati, B., Tesche, M., Tunved, P.,
Väänänen, R., and Petäjä, T.: Low hygroscopic scattering
enhancement of boreal aerosol and the implications for a columnar optical
closure study, Atmos. Chem. Phys., 15, 7247–7267,
<a href="https://doi.org/10.5194/acp-15-7247-2015" target="_blank">https://doi.org/10.5194/acp-15-7247-2015</a>, 2015.
</mixed-citation></ref-html>
<ref-html id="bib1.bib109"><label>109</label><mixed-citation>
Zimmermann, R.: Aerosols and health: a challenge for chemical and biological
analysis, Anal. Bioanal. Chem., 407, 5863–5867,
<a href="https://doi.org/10.1007/s00216-015-8832-x" target="_blank">https://doi.org/10.1007/s00216-015-8832-x</a>, 2015.
</mixed-citation></ref-html>--></article>
