<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" article-type="review-article">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">metabolites</journal-id>
      <journal-title>Metabolites</journal-title>
      <abbrev-journal-title abbrev-type="publisher">Metabolites</abbrev-journal-title>
      <abbrev-journal-title abbrev-type="pubmed">Metabolites</abbrev-journal-title>
      <issn pub-type="epub">2218-1989</issn>
      <publisher>
        <publisher-name>MDPI</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.3390/metabo2040733</article-id>
      <article-id pub-id-type="publisher-id">metabolites-02-00733</article-id>
      <article-categories>
        <subj-group>
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Computational Methods for Metabolomic Data Analysis of Ion Mobility Spectrometry Data—Reviewing the State of the Art </article-title>
      </title-group>
      
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Hauschild</surname>
            <given-names>Anne-Christin</given-names>
          </name>
          <xref rid="af1-metabolites-02-00733" ref-type="aff">1</xref>
          <xref rid="af2-metabolites-02-00733" ref-type="aff">2</xref>
          <xref rid="c1-metabolites-02-00733" ref-type="corresp">*</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Schneider</surname>
            <given-names>Till</given-names>
          </name>
          <xref rid="af1-metabolites-02-00733" ref-type="aff">1</xref>
          <xref rid="af2-metabolites-02-00733" ref-type="aff">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Pauling</surname>
            <given-names>Josch</given-names>
          </name>
          <xref rid="af1-metabolites-02-00733" ref-type="aff">1</xref>
          <xref rid="af2-metabolites-02-00733" ref-type="aff">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Rupp</surname>
            <given-names>Kathrin</given-names>
          </name>
          <xref rid="af3-metabolites-02-00733" ref-type="aff">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Jang</surname>
            <given-names>Mi</given-names>
          </name>
          <xref rid="af3-metabolites-02-00733" ref-type="aff">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Baumbach</surname>
            <given-names>Jörg Ingo</given-names>
          </name>
          <xref rid="af3-metabolites-02-00733" ref-type="aff">3</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Baumbach</surname>
            <given-names>Jan</given-names>
          </name>
          <xref rid="af1-metabolites-02-00733" ref-type="aff">1</xref>
          <xref rid="af2-metabolites-02-00733" ref-type="aff">2</xref>
          <xref rid="af4-metabolites-02-00733" ref-type="aff">4</xref>
          <xref rid="c1-metabolites-02-00733" ref-type="corresp">*</xref>
        </contrib>
      </contrib-group>
      <aff id="af1-metabolites-02-00733"><label>1 </label>Computational Systems Biology Group, Max Planck Institute for Informatics, D-66123, Saarbrücken, Germany</aff>
      <aff id="af2-metabolites-02-00733"><label>2 </label>Cluster of Excellence for Multimodal Computing and Interaction, Saarland University, D-66123 Saarbrücken, Germany</aff>
      <aff id="af3-metabolites-02-00733"><label>3 </label>Department Microfluidics and Clinical Diagnostics, KIST Europe-Korea Institute of Science and Technology Europe, Campus E7.1, D-66123, Saarbrücken, Germany</aff>
      <aff id="af4-metabolites-02-00733"><label>4 </label>Computational Biology group, Department of Mathematics and Computer Science, University of Southern Denmark, DK-5230, Odense, Denmark</aff>
      <author-notes>
        <corresp id="c1-metabolites-02-00733"><label>*</label> Authors to whom correspondence should be addressed; Email: <email>a.hauschild@mpi-inf.mpg.de</email> (A.C.H.); <email>jan.baumbach@mpi-inf.mpg.de</email> (J.B.); Tel.: +49 681 302-70885 (A.C.H.); Fax: +49 681 9325 399 (A.C.H.); Tel.: +49 681 302 70880 (J.B.); Fax: +49 681 9325 399 (J.B.).</corresp>
      </author-notes>
      <pub-date pub-type="epub">
        <day>16</day>
        <month>10</month>
        <year>2012</year>
      </pub-date>
      <pub-date pub-type="collection"><month>12</month>
        <year>2012</year>
      </pub-date>
      <volume>2</volume>
      <issue>4</issue>
      <fpage>733</fpage>
      <lpage>755</lpage>
      <history>
        <date date-type="received">
          <day>08</day>
          <month>08</month>
          <year>2012</year>
        </date>
        <date date-type="rev-recd">
          <day>24</day>
          <month>09</month>
          <year>2012</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>09</month>
          <year>2012</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>©  2012 by the authors; licensee MDPI, Basel, Switzerland.</copyright-statement>
        <copyright-year>2012</copyright-year>
        <license xmlns:xlink="http://www.w3.org/1999/xlink" license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/3.0/">
          <p>This article is an open-access article distributed under the terms and conditions of the Creative Commons Attribution license (http://creativecommons.org/licenses/by/3.0/).</p>
        </license>
      </permissions>
      <abstract>
        <p>Ion mobility spectrometry combined with multi-capillary columns (MCC/IMS) is a well-known technology for detecting volatile organic compounds (VOCs). We may utilize MCC/IMS for scanning human exhaled air, bacterial colonies or cell lines, for example. Thereby we gain information about the human health status or infection threats. We may further study the metabolic response of living cells to external perturbations. The instrument is comparatively cheap, robust and easy to use in everyday practice. However, the potential of the MCC/IMS methodology depends on the successful application of computational approaches for analyzing the huge amount of emerging data sets. Here, we will review the state of the art and highlight existing challenges. First, we address methods for raw data handling, data storage and visualization. Afterwards we will introduce de-noising, peak picking and other pre-processing approaches. We will discuss statistical methods for analyzing correlations between peaks and diseases or medical treatment. Finally, we study up-to-date machine learning techniques for identifying robust biomarker molecules that allow classifying patients into healthy and diseased groups. We conclude that MCC/IMS coupled with sophisticated computational methods has the potential to successfully address a broad range of biomedical questions. While we can solve most of the data pre-processing steps satisfactorily, some computational challenges with statistical learning and model validation remain.</p>
      </abstract>
      <kwd-group>
        <kwd>ion mobility spectrometry</kwd>
        <kwd>clinical diagnostics</kwd>
        <kwd>peak detection</kwd>
        <kwd>statistics</kwd>
        <kwd>statistical learning methods</kwd>
        <kwd>metabolomics</kwd>
        <kwd>volatile organic compounds</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="intro">
      <title>1. Introduction</title>
      <p>Ion mobility spectrometers combined with a multi-capillary column (MCC/IMS) are well known for detecting volatile organic compounds (VOCs). Initially developed for military purposes, they are nowadays used for various applications, for example process control in the chemical or petrochemical industry, or scanning human exhaled air/breath, bacterial colonies or cell lines. The combination of the MCC/IMS methodology and sophisticated computational approaches has the potential to successfully address a broad range of biomedical questions. These include, on the one hand, building statistical models for disease prediction and the identification of biomarkers and, on the other hand, determining cell states and metabolic responses of microorganisms or assessing food quality.</p>
      <sec>
        <title>1.1. Overview: Ion Mobility Spectrometry</title>
        <p>There are several analytical detection methods for human breath investigations. The major spectrometric methods currently employed are gas chromatography-mass spectrometry (GC/MS) [<xref ref-type="bibr" rid="B1-metabolites-02-00733">1</xref>,<xref ref-type="bibr" rid="B2-metabolites-02-00733">2</xref>,<xref ref-type="bibr" rid="B3-metabolites-02-00733">3</xref>,<xref ref-type="bibr" rid="B4-metabolites-02-00733">4</xref>], solid phase micro extraction-gas chromatography coupled with mass spectrometry (SPME-GC/MS) [<xref ref-type="bibr" rid="B1-metabolites-02-00733">1</xref>,<xref ref-type="bibr" rid="B5-metabolites-02-00733">5</xref>,<xref ref-type="bibr" rid="B6-metabolites-02-00733">6</xref>], electronic noses [<xref ref-type="bibr" rid="B7-metabolites-02-00733">7</xref>,<xref ref-type="bibr" rid="B8-metabolites-02-00733">8</xref>,<xref ref-type="bibr" rid="B9-metabolites-02-00733">9</xref>,<xref ref-type="bibr" rid="B10-metabolites-02-00733">10</xref>], proton transfer reaction-mass spectrometry (PTR-MS) [<xref ref-type="bibr" rid="B11-metabolites-02-00733">11</xref>,<xref ref-type="bibr" rid="B12-metabolites-02-00733">12</xref>] and ion mobility spectrometry (IMS) [<xref ref-type="bibr" rid="B13-metabolites-02-00733">13</xref>,<xref ref-type="bibr" rid="B14-metabolites-02-00733">14</xref>,<xref ref-type="bibr" rid="B15-metabolites-02-00733">15</xref>,<xref ref-type="bibr" rid="B16-metabolites-02-00733">16</xref>,<xref ref-type="bibr" rid="B17-metabolites-02-00733">17</xref>,<xref ref-type="bibr" rid="B18-metabolites-02-00733">18</xref>,<xref ref-type="bibr" rid="B19-metabolites-02-00733">19</xref>]. The real time analysis (e.g. PTR-MS, IMS) has the advantage that no pre-concentration step is needed [<xref ref-type="bibr" rid="B20-metabolites-02-00733">20</xref>]. 
Sampling is achieved directly by using Tedlar bags [<xref ref-type="bibr" rid="B21-metabolites-02-00733">21</xref>,<xref ref-type="bibr" rid="B22-metabolites-02-00733">22</xref>,<xref ref-type="bibr" rid="B23-metabolites-02-00733">23</xref>], needle traps [<xref ref-type="bibr" rid="B24-metabolites-02-00733">24</xref>], SPME [<xref ref-type="bibr" rid="B5-metabolites-02-00733">5</xref>,<xref ref-type="bibr" rid="B25-metabolites-02-00733">25</xref>], sample loops [<xref ref-type="bibr" rid="B26-metabolites-02-00733">26</xref>] and different adsorbents. They are all non-invasive and should provide early and fast diagnosis or therapy monitoring for the identification of disease-specific biomarkers in the patients’ breath.</p>
        <p>Ion mobility spectrometry is a method to detect volatile organic compounds (VOCs). The first IMS instruments, created in the early 1970s, were originally used for military applications [<xref ref-type="bibr" rid="B27-metabolites-02-00733">27</xref>,<xref ref-type="bibr" rid="B28-metabolites-02-00733">28</xref>]. Furthermore, IMS instruments were used to detect drugs or explosives, e.g., at airports. With the growing importance of metabolomics, the focus changed, and today IMS is also used in medical applications. Through combination of the IMS with multi-capillary columns (MCC), many possible application opportunities arise. The main advantages of this method are the short time required to collect a sample (about 10 s), the non-invasive nature of the method, the use of easily obtainable exhaled breath, and the robust and easy handling in everyday practice. The MCC/IMS based on BioScout was developed by B&amp;S Analytik (Dortmund, Germany) for medical [<xref ref-type="bibr" rid="B29-metabolites-02-00733">29</xref>,<xref ref-type="bibr" rid="B30-metabolites-02-00733">30</xref>] and biomedical [<xref ref-type="bibr" rid="B31-metabolites-02-00733">31</xref>] applications as well as for process analysis [<xref ref-type="bibr" rid="B14-metabolites-02-00733">14</xref>].</p>
        <p>Acquiring a single spectrum takes only 10 ms to 100 ms [<xref ref-type="bibr" rid="B32-metabolites-02-00733">32</xref>]. To obtain an MCC/IMS chromatogram a certain setup of the MCC/IMS is needed. Driven by the carrier gas the analytes first reach the MCC, where the pre-separation takes place. In this column there are approx. 1,000 parallel capillaries, each with a film thickness of 200 nm and an inner diameter of 40 µm. In general the OV-5 phase (5% Phenyl / 95% Dimethyl Polysiloxane) is used [<xref ref-type="bibr" rid="B30-metabolites-02-00733">30</xref>]. After passing the MCC, the analytes reach the ionization chamber, where they become chemically ionized by collisions with ionized carrier gas molecules. The carrier gas molecules were previously ionized by a radioactive ionization source (<sup>63</sup>Ni) and form so-called reactant ions. After the chemical ionization, the resulting product ions enter the drift region when the ion shutter is open (<xref ref-type="fig" rid="metabolites-02-00733-f001">Figure 1</xref>). In this region, an external electric field is applied. A so-called drift gas will flow from the Faraday-Plate towards the ions; neutral molecules cannot enter the drift region and the ionized molecules will gain energy from the electric field and soon reach a steady drift velocity by collision with neutral drift gas molecules. That means that all molecules are, in an ideal case, totally separated when they reach the Faraday-Plate. In the end, a spectrum is generated, which is called an ion mobility spectrum. The accumulation of all IMS spectra pre-separated by the MCC is called an IMS chromatogram.</p>
        <fig id="metabolites-02-00733-f001" position="anchor">
          <label>Figure 1</label>
          <caption>
            <p>Working principle of an Ion Mobility Spectrometer.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="metabolites-02-00733-g001.tif"/>
        </fig>
      </sec>
      <sec>
        <title>1.2. Outline</title>
        <p>The present paper gives an overview of the state of the art data processing, data mining and evaluation methods, used for the analysis of MCC/IMS chromatograms. <xref ref-type="fig" rid="metabolites-02-00733-f002">Figure 2</xref> depicts the workflow of the processing pipeline handling the MCC/IMS data. The first step is the data collection in laboratories and hospitals, both the results of the diagnostic technique analyzing human breath, as well as additional information (e.g., age, gender, medication, medium of the bacterial strain, various diagnostic techniques, <italic>etc</italic>.). The next step is the pre-processing of the chromatograms, enhancing the quality (e.g., de-noising, smoothing) and detecting the VOC areas (peaks). The results are verified using the available visualization tools. The pre-processed data is subsequently accumulated in a centralized data repository, e.g., a database. Furthermore, the additional information of the organism is prepared to be included into the system. Statistical techniques like Mann-Whitney U test and principal component analysis as well as statistical learning methods, e.g., decision tree and support vector machines are applied to find biomarkers. The biomarkers are verified in the wet lab. They may later be used for disease prediction and disease specific pathway analysis. </p>
        
        <p>Each step of the workflow will be explained in the following chapters of this review. We start with a recap of the data format, the visualization and a detailed explanation of the different preprocessing steps: RIP de-tailing, smoothing, de-noising and peak finding. In addition, an introduction to the existing databases and the future requirements is given. <xref ref-type="sec" rid="sec3-metabolites-02-00733">Section three</xref> depicts the studies using statistical techniques like Mann-Whitney U test, correlation and principal component analysis. We continue with a description of the statistical learning methods applied to MCC/IMS data sets in <xref ref-type="sec" rid="sec4-metabolites-02-00733">section four</xref>. Finally, we will sum up, illuminate unsolved problems, and provide potential solutions.</p>
        <fig id="metabolites-02-00733-f002" position="anchor">
          <label>Figure 2</label>
          <caption>
            <p>Workflow of the data processing, data mining and evaluation methods used in clinical breath diagnostics.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="metabolites-02-00733-g002.tif"/>
        </fig>
      </sec>
    </sec>
    <sec>
      <title>2. First Steps with IMS Data</title>
      <sec id="sec2dot1-metabolites-02-00733">
        <title>2.1. Data Format</title>
        <p>Over the years, the central question that has motivated the application of IMS and MCC/IMS devices has changed from “Is a particular analyte present?” (detection of explosives, drugs, and chemical warfare agents) to “Which analytes are present in which concentration?” (biomedical on-site analysis, drug monitoring, disease fingerprinting) [<xref ref-type="bibr" rid="B33-metabolites-02-00733">33</xref>]. This leads to utilizing computational and bioinformatical techniques, which are explained throughout the following sections. A broader area of application comes with new requirements in terms of tracking experimental conditions, since this may influence not only the measurement itself, but also its interpretation and give vital information for further data processing, such as the combined analysis of data from different studies. Thus, a sophisticated uniform data format is required, which stores not only the data itself but also experimental and technical conditions. Vautz <italic>et al.</italic> proposed such a standard file format [<xref ref-type="bibr" rid="B33-metabolites-02-00733">33</xref>]. It consists of a header and the data matrix. The header comprises all sampling conditions such as general information, sample information, IMS (device) information, external sampling control, and statistics. They also provide standard nomenclature rules and an extension that is dedicated to sensor-controlled sampling. For details, please refer to supplementary material of Vautz <italic>et al.</italic> [<xref ref-type="bibr" rid="B33-metabolites-02-00733">33</xref>]. A later, related publication by Maddula <italic>et al.</italic> suggests an extension to the standard file format, which allows cross-linking gas chromatography/mass selective detector (GC/MSD) data with MCC/IMS data [<xref ref-type="bibr" rid="B34-metabolites-02-00733">34</xref>].</p>
      </sec>
      <sec>
        <title>2.2. Visualization</title>
        <p>Several software tools are available for the visualization of IMS-chromatograms. The software package IPHEX (by A. Bunkowski, University Bielefeld, Germany) supports the visualization including single spectra and total ion current of the MCC [<xref ref-type="bibr" rid="B35-metabolites-02-00733">35</xref>]. The commercial software package VisualNow (B&amp;S Analytik, Dortmund, Germany), which is implemented in Java, is another state of the art software tool. It provides the ability to show two- and three-dimensional plots of the whole IMS chromatogram as well as all technical parameters. The acquired data of the MCC/IMS file includes a set of parameters describing the measurements, experimental setup and a set of single spectra at different retention times, see <xref ref-type="sec" rid="sec2dot1-metabolites-02-00733">Section 2.1</xref> for more details [<xref ref-type="bibr" rid="B36-metabolites-02-00733">36</xref>]. In both software tools the IMS-chromatogram of the selected data file is plotted as a two-dimensional picture, e.g., VisualNow plot shown in <xref ref-type="fig" rid="metabolites-02-00733-f003">Figure 3</xref> (a). </p>
       
        <p>In the MCC/IMS-chromatogram the X-axis represents the reduced inverse mobility 1/K<sub>0</sub> (Vs/cm<sup>2</sup>) and the Y-axis shows the retention time (s). The reduced inverse mobility is proportional to the drift time. Moreover, in order to compare spectra obtained using different experimental conditions the value is normalized by temperature and pressure [<xref ref-type="bibr" rid="B37-metabolites-02-00733">37</xref>]. The signal height is the signal from the Faraday plate of the IMS device. In general, the so-called intensity is color-coded in both plots, whereby the yellow color means the highest signal and the white color the lowest. In the three-dimensional plot the Z-axis expresses the intensity [<xref ref-type="bibr" rid="B38-metabolites-02-00733">38</xref>]. In order to compare or show single spectra of different peaks, a spectrum can be selected and shown in a separate plot, which can be examined visually.</p>
        <p>The single spectrum at the selected ion mobility and the single spectrum at the selected retention time in VisualNow are shown in <xref ref-type="fig" rid="metabolites-02-00733-f003">Figure 3</xref> (b) and (c), respectively. Depending on the characteristics of the data, in some cases a three-dimensional plot can be suitable to identify and compare the peaks captured by the MCC/IMS [<xref ref-type="bibr" rid="B36-metabolites-02-00733">36</xref>]. A region in the two-dimensional plot can be selected, and visualized in a three-dimensional plot, see <xref ref-type="fig" rid="metabolites-02-00733-f004">Figure 4</xref> (a) and (b), respectively. </p>
       
        <p>In addition to this, both tools are capable of visualizing a mapping of the MCC retention time to the retention time of a gas chromatographic measurement. For details on the alignment methods between MCC and GC, we refer to [<xref ref-type="bibr" rid="B2-metabolites-02-00733">2</xref>] and [<xref ref-type="bibr" rid="B35-metabolites-02-00733">35</xref>].</p>
         <fig id="metabolites-02-00733-f003" position="anchor">
          <label>Figure 3</label>
          <caption>
            <p><bold>(a)</bold> Visualization of the ion mobility spectrometry (IMS)-chromatogram; <bold>(b)</bold> Single ion mobility spectrum; <bold>(c) </bold>Single multi-capillary column (MCC) spectrum.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="metabolites-02-00733-g003.tif"/>
        </fig>
         <fig id="metabolites-02-00733-f004" position="anchor">
          <label>Figure 4</label>
          <caption>
            <p><bold>(a)</bold> IMS chromatogram; <bold>(b)</bold> A selected area (green) within the MCC/IMS chromatogram is converted into a three-dimensional plot.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="metabolites-02-00733-g004.tif"/>
        </fig>
      </sec>
      <sec id="sec2dot3-metabolites-02-00733"> 
        <title>2.3. Pre-processing</title>
        <p>A MCC/IMS measurement typically consists of more than a million three-dimensional data points indicating signal intensities. Furthermore, there is a characteristic signal structure found in all IMS spectra of a chromatogram that is known as the reactant ion peak (RIP). The RIP is generally the highest and broadest peak and appears in the shape of a broad vertical line on the chromatogram (<xref ref-type="fig" rid="metabolites-02-00733-f005">Figure 5</xref>). The signal descent on the right side of the RIP is called RIP tailing (<xref ref-type="fig" rid="metabolites-02-00733-f005">Figure 5</xref>). RIP tailing can be considered as a source of disturbance. For this reason, Bader <italic>et al.</italic> performed RIP de-tailing by fitting a lognormal function to the mean of all spectra and subtracting this function from each spectrum in the chromatogram [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>]. Bunkowski achieved RIP de-tailing by subtracting the 25% quantile intensity determined for each 1/K<sub>0</sub> value over all spectra [<xref ref-type="bibr" rid="B40-metabolites-02-00733">40</xref>].</p>
        
        <p>Besides RIP tailing, the random fluctuation in the signals, casually called noise, affects the ability to distinguish low intensity signals. Basically, all signal and non-signal (background) parts of a spectrum are overlaid by noise. Therefore, the data needs to be pre-processed by smoothing and de-noising methods (Section 2.3.1), in order to improve the signal-to-noise ratio as well as the clarity of the peaks, which are related to specific analytes. As the noise in the IMS data does not typically vary around zero, a baseline correction is performed, which improves the comparison of IMS data. Bader addressed this problem by subtracting the mean intensity of a pure noise region from all spectra of an IMS chromatogram [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>].</p>
        <fig id="metabolites-02-00733-f005" position="anchor">
          <label>Figure 5</label>
          <caption>
            <p>MCC/IMS chromatograms of raw <bold>(a)</bold>, smoothed <bold>(b)</bold>, and de-noised <bold>(c)</bold> data, illustrating the remaining information after de-noising and smoothing. 2D side views of raw <bold>(d)</bold>, smoothed <bold>(e)</bold>, and de-noised <bold>(f)</bold> chromatograms also show different baselines of the peaks caused by RIP tailing [<xref ref-type="bibr" rid="B41-metabolites-02-00733">41</xref>]. Reproduced with permission from Bader <italic>et al.</italic>, International Journal of Ion Mobility Spectrometry published by Springer-Verlag, 2008.</p>
          </caption>
          <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="metabolites-02-00733-g005.tif"/>
        </fig>
        <sec>
          <title>2.3.1. De-noising and Smoothing</title>
          <p>In Bader <italic>et al.</italic> 2008 [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>], a multi resolution analysis was applied to the data, which includes discrete wavelet transforms on different levels of resolution for both de-noising and smoothing, based on a combination of the approaches presented by Urbas <italic>et al.</italic> [<xref ref-type="bibr" rid="B42-metabolites-02-00733">42</xref>], and Cai <italic>et al.</italic> [<xref ref-type="bibr" rid="B43-metabolites-02-00733">43</xref>]. The corresponding wavelet coefficients, utilized to reconstruct the original chromatogram, can be altered using hard and soft thresholding. Removing coefficients corresponding to high frequency regions, independent of the coefficient amplitude, results in smoothing. The elimination of low amplitude coefficients regardless of frequency, results in de-noising. In doing so, IMS data is compressed to 25% or less of the original data, with negligible loss of information.</p>
          <p>Another approach for de-noising is the application of a filter pipeline described by Bunkowski [<xref ref-type="bibr" rid="B40-metabolites-02-00733">40</xref>], where a median filter is first employed for de-noising, followed by a Savitzky-Golay filter, described in Savitzky <italic>et al.</italic> [<xref ref-type="bibr" rid="B44-metabolites-02-00733">44</xref>], and finally a Gaussian filter [<xref ref-type="bibr" rid="B45-metabolites-02-00733">45</xref>]. </p>
          <p>In addition to computational methods for de-noising, which are applied to the raw data, there are also methods for de-noising in electrical engineering, which are considered during the instrument design. Unfortunately all these methods, which are out of the scope of this publication, have the limitation of partial irrecoverable raw data loss. Especially in cases of large concentration differences within one sample and co-existing large, small, and sometimes overlapping peaks, the balance between noise reduction and the potential loss of resolution has to be considered carefully.</p>
        </sec>
        <sec>
          <title>2.3.2. Peak Detection</title>
          <p>After pre-processing, peaks have to be identified in each single MCC/IMS measurement. Bader and Bunkowski developed different strategies to accomplish this task. Bader <italic>et al.</italic> presented three methods for peak finding referred to as Merged Peak Cluster Localization (MPCL), Growing Interval Merging (GIM), and Wavelet-Based Multiscale Peak Detection (WBMPD) [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>]. The algorithms of Bunkowski <italic>et al.</italic> are based on watershed transformation (WST) [<xref ref-type="bibr" rid="B40-metabolites-02-00733">40</xref>]. The methods are explained in the following sections.</p>
          <p><bold>Merged Peak Cluster Localization (MPCL):</bold> This peak picking method utilizes a robust, locally weighted regression and smoothing scatterplot (LOWESS) algorithm by Cleveland <italic>et al.</italic> for baseline correction and reduction of RIP tailing [<xref ref-type="bibr" rid="B46-metabolites-02-00733">46</xref>]. In the first phase, all data points starting after the RIP are separated into two classes (peak and non-peak) by k-means clustering using a Euclidean distance metric of the intensity, whereby the two starting mean values can be chosen. Under the assumption of noise varying around zero, the non-peak class mean can be chosen as zero. Due to a large degree of misclassifications of high noise intensity points to the peak cluster, a filtering step is performed, whereby a peak cluster point is assigned to the non-peak cluster if at least one of its eight neighbor points belongs to the non-peak cluster. In the second phase, different peaks are identified by a merging regions algorithm based on Bruce <italic>et al.</italic> [<xref ref-type="bibr" rid="B47-metabolites-02-00733">47</xref>]. Taking the binary data points delivered from the first phase, adjacent points of the peak class are merged to form one peak. Finally, a set of distinct peaks for a single measurement is obtained. The limitation of this approach lies in the distinction of two overlapping neighbor peaks, where the overlap’s signal intensity is above the peak-to-noise-threshold. In this case, the merging regions algorithm will fail to distinguish between the two peaks [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>].</p>
          <p><bold>Growing interval merging (GIM): </bold>This approach was used to overcome the resolution problems of the previous method. An iterative algorithm starts at the top of the intensity range, separates noise from peak data points and merges the discovered peaks in a stepwise manner along the intensity scale. Noise and RIP thresholds are defined by analysis of the intensity histogram, which is divided into three regions, namely noise (most data points), peak (second most data points) and RIP (small number of data points). The intensity range given in the peak region is divided into subintervals with evenly distributed data points. Those subintervals are scanned stepwise with descending intensity. Subsequently, the data points of the current sub-interval are assigned to the peak class. Afterwards, the second phase of the MPCL method is applied. This process yields peak lists with distinct peaks. All elements of the current peak list are merged with the ones contained in the previous peak list, provided they have several data points in common. Subsequently, the old peak parameters (maximum intensity with 1/K<sub>0</sub> and RT coordinate, two ellipse axes and ellipse area) are overridden by the current parameters. This merging procedure allows the algorithm to distinguish between peaks which overlap or whose in-between area lifts off from the noise. Overall, GIM outperforms MPCL in terms of peak resolution, and extracts six parameters for each peak found. Nevertheless, there are limitations to the method, as overlapping peaks cannot always be distinguished. Furthermore, the separation of peaks with one or more local maxima in the tailing region is not possible.</p>
          <p><bold>Wavelet-based multiscale peak detection (WBMPD): </bold>The third peak-finding method of Bader [<xref ref-type="bibr" rid="B41-metabolites-02-00733">41</xref>] is partly based on “The multiscale processing of single spectra”, introduced by Randolph and Yasui [<xref ref-type="bibr" rid="B48-metabolites-02-00733">48</xref>], which is less suited for processing a series of spectra. Multiple resolution analysis (MRA) is performed using the maximal overlap discrete wavelet transform (MODWT), allowing the sample size to be arbitrary while the discrete wavelet transform is bound to a sample size that is a power of two. Furthermore, MODWT is translation invariant, which is beneficial for shifted IMS chromatograms. Compared to Daubechies D(4) wavelets, Haar wavelets show fewer artifacts in the RIP region at low retention times in a chromatogram, and are therefore preferred. The stepwise MRA process passes a chromatogram from higher to lower resolutions. It splits the low pass part of the current chromatogram into four sub-images: lowpass-highpass (LH), lowpass-lowpass (LL), highpass-lowpass (HL), and highpass-highpass (HH). The LH image of this so-called wavelet decomposition contains only details, which means the fine-grained variations within the chromatogram, in contrast to the coarse chromatogram structure of the LL image. Here, the GIM method of the previous paragraph is applied to the LH image. All decomposition steps are then connected by merging common peaks. In doing so, current ellipse peak parameters are replaced by ellipse parameters of the next step, where more grainy structures are scanned if both ellipses have peak data points in common. Newly found ellipses, which do not share peak data points, are added to the peak list. Compared to the standalone GIM method, WBMPD can detect peaks enclosed in the shoulder of other peaks. 
The evaluation of Bader <italic>et al.</italic> shows that this method is highly sensitive, with only a small number of false positive classifications that can be filtered out by a clustering method when comparing a set of measurements.</p>
          <p><bold>Water shed transformation (WST): </bold>Another peak finding method for IMS data is described by Bunkowski [<xref ref-type="bibr" rid="B40-metabolites-02-00733">40</xref>]. This method is based on an approach of Wegner <italic>et al.</italic> [<xref ref-type="bibr" rid="B49-metabolites-02-00733">49</xref>] used for spot detection on 2D gel electrophoresis images. For further details about water shed transformation, the reader is referred to the publications of Meyer <italic>et al.</italic> [<xref ref-type="bibr" rid="B50-metabolites-02-00733">50</xref>] or Vincent <italic>et al.</italic> [<xref ref-type="bibr" rid="B51-metabolites-02-00733">51</xref>].</p>
          <p>The intuitive underlying working principle of this method is as follows. Imagine that an IMS chromatogram image is turned upside down and interpreted as a topographical surface. This surface is flooded with water, from bottom to top, from different sources that are each located at a local intensity maximum (peak). The water will accumulate stepwise in catchment basins from higher to lower intensities, <italic>i.e.</italic>, the highest peaks are filled with water first. </p>
          <p>When the water level reaches the limit of overflow to another basin, a watershed is built which separates the basins. The overall process segments an IMS chromatogram into peaks and peak parameters similar to the aforementioned methods. However, in contrast to the other approaches, this method delivers the volume of a peak, which can then be taken into account for further analysis. Unfortunately, no well-structured assessment of this method is available so far.</p>
        </sec>
        <sec>
          <title>2.3.3. Merging Peak Sets</title>
          <p>Enabling further analysis of differences and similarities between measurements requires a grouping of peaks that are related to the same analyte. Therefore, the determination of peak sets among all measurements, together with the unambiguous assignment of peaks to those sets, is necessary. In all peak finding and characterization approaches described here, typical peak regions serve as peak group descriptors, which are characterized by a center point, 1/K<sub>0</sub> radius, and RT radius, and can also be used to identify specific analytes [<xref ref-type="bibr" rid="B29-metabolites-02-00733">29</xref>,<xref ref-type="bibr" rid="B52-metabolites-02-00733">52</xref>]. The challenge is to refer each peak to a general peak region. Unfortunately, all parameters of a peak related to a particular analyte vary among several measurements. This impedes assignment to the correct peak region, especially if there is a fluctuation in the position of maximum peak intensity. Based on the coordinates of the maximum for each peak, a pipeline of two separate clustering methods is established [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>]. The first clustering is used to find the mean position of each cluster. The second clustering method takes these positions as starting points and associates each peak to a cluster. Bader <italic>et al.</italic> [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>] compared different combinations of clustering methods. The combination of (1) Ward’s clustering method [<xref ref-type="bibr" rid="B53-metabolites-02-00733">53</xref>] with (2) a k-means algorithm using the Euclidean distance gives the best results according to the variance ratio criterion and average silhouette width [<xref ref-type="bibr" rid="B39-metabolites-02-00733">39</xref>]. </p>
        </sec>
      </sec>
      <sec>
        <title>2.4. Database</title>
        <p>Driven by the demand for rapid data analysis and biomarker discovery, there is a need for the establishment of a centralized data repository to facilitate the identification of analytes and for data mining in studies such as clinical trials. In contrast to other techniques like mass spectrometry, for which a couple of data organizing tools are available (for example OpenMS [<xref ref-type="bibr" rid="B54-metabolites-02-00733">54</xref>]), the IMS community lacks such a system.</p>
        <p>In 2007, Lesniak developed the first database schema to organize IMS data [<xref ref-type="bibr" rid="B55-metabolites-02-00733">55</xref>]. Nevertheless, this approach is not able to store arbitrary entities, attributes and values, as well as relations between entities, which is beneficial to make the database adaptable to any kind of up-coming medical annotation data. The goal is to allow a flexible management of analytical data (MCC/IMS, GC/MS) combined with medical data (diseases, medication, age, gender, etc.) provided by physicians or biologists. Flexibility can be ensured by an ontology-based generalized data structure, which enables the system to store any kind of information without changing the database schema.</p>
        <p>Note that a major drawback of such a generic model is a performance loss under particular circumstances due to a higher model complexity. Compared to conventional database schemas, queries are more complex and especially attribute-centric queries perform worse [<xref ref-type="bibr" rid="B56-metabolites-02-00733">56</xref>]. However, in a proper case of application, profit can be derived from the flexibility offered by such a model. </p>
        <p>A database system including metabolite profiles and corresponding patient data will allow the extraction of interesting data sets as a starting point for statistical analysis (<xref ref-type="sec" rid="sec3-metabolites-02-00733">Section 3</xref>) and statistical learning (<xref ref-type="sec" rid="sec4-metabolites-02-00733">Section 4</xref>). Such a system is currently being developed at KIST Europe and the Max Planck Institute for Informatics, Saarbrücken, Germany.</p>
      </sec>
    </sec>
    <sec id="sec3-metabolites-02-00733">
      <title>3. Statistical Analysis</title>
      <sec>
        <title>3.1. Statistical Tests</title>
        <p>The aim of clinical diagnostics is to detect molecules, so-called biomarkers, that can give the answer to a specific question, e.g., concerning the health status of a person (disease, no-disease). If a single molecule or antibody in the blood, urine or breath having direct relation to the analyzed disease status exists, it can be detected by statistical tests. </p>
        <p>For methodological reasons, the assumption that the intensity of molecules within the chromatogram is drawn from a Gaussian distribution is not valid [<xref ref-type="bibr" rid="B57-metabolites-02-00733">57</xref>]. Therefore the community of ion mobility spectrometry relies on non-parametric tests, especially the Mann-Whitney U test. This test, also called rank sum test, is an unpaired hypothesis test to verify whether two samples are drawn from the same distribution, or more precisely, whether one of two samples of independent observations tends to have smaller values than the other. In the following, we briefly describe several studies that analyzed exhaled air of patients using MCC/IMS and applied the Mann-Whitney U test to distinguish between different health states.</p>
        <p>In 2011, Bessa <italic>et al.</italic> [<xref ref-type="bibr" rid="B58-metabolites-02-00733">58</xref>] and Koczulla <italic>et al.</italic> [<xref ref-type="bibr" rid="B59-metabolites-02-00733">59</xref>] examined the volatile organic compounds in exhaled breath of patients suffering from chronic obstructive pulmonary disease (COPD). The first study used the rank sum test to differentiate between COPD patients and healthy controls. The second study focused on the classification of COPD patients with and without alpha 1-antitrypsin deficiency. In both studies, rank sum analysis led to the identification of potential single biomarker candidates.</p>
        <p>A further example for the application of the rank sum test is the detection of microorganisms in the human body. According to Rabis <italic>et al.</italic> 2011, bacteria produce VOCs [<xref ref-type="bibr" rid="B60-metabolites-02-00733">60</xref>]. In their study, they focused on <italic>Pseudomonas aeruginosa</italic>, a bacterium, which is associated with COPD exacerbation. They investigated the exhaled air of <italic>Pseudomonas</italic>-infected patients compared to healthy non-smokers. The Mann-Whitney U test was applied to deduce the most discriminative signals, which resulted in a best accuracy of 88%.</p>
      </sec>
      <sec>
        <title>3.2. Correlation</title>
        <p>Another method to evaluate the relation of different variables is the Pearson correlation. In 2011 Maddula <italic>et al.</italic> utilized this to analyze the similarity between the metabolites, which they used as indicators in their disease analysis, especially those identified as important [<xref ref-type="bibr" rid="B61-metabolites-02-00733">61</xref>]. In fact, the Pearson correlation can be used (1) to find sets or clusters of related metabolites exposing the same behavior and (2) to reduce the data set by selecting representatives for each cluster. Moreover, it would be interesting to investigate whether a set of metabolites showing the same pattern also originates from the same pathway.</p>
        <p>Additionally, the Pearson correlation was applied to evaluate whether medication levels detected within the breath can be associated with other state of the art methods for that purpose. Both Kreuder <italic>et al.</italic> [<xref ref-type="bibr" rid="B62-metabolites-02-00733">62</xref>] and Carstens <italic>et al.</italic> [<xref ref-type="bibr" rid="B63-metabolites-02-00733">63</xref>] investigated the intensity of propofol within the breath of patients undergoing anesthesia, utilizing the MCC/IMS technique. While Kreuder <italic>et al.</italic> [<xref ref-type="bibr" rid="B62-metabolites-02-00733">62</xref>] compared the MCC/IMS propofol intensity with the TCI pump calculated plasma values, Carstens <italic>et al.</italic> [<xref ref-type="bibr" rid="B63-metabolites-02-00733">63</xref>] correlated their results with the propofol serum concentration determined by gas chromatography-mass spectrometry (GC/MS). Both studies report a strong correlation between the level of propofol in breath and the used plasma level.</p>
      </sec>
      <sec>
        <title>3.3. Principal Component Analysis</title>
        <p>Principal Component Analysis (PCA), first introduced by Pearson [<xref ref-type="bibr" rid="B64-metabolites-02-00733">64</xref>], is a computational/mathematical technique that is used in practice to reduce the dimensionality of a given data set and to find linearly independent variables that most dominantly express the underlying data model (principal components). A very high dimensionality of the data set can cause extensive over-fitting in any following statistical learning procedures. A prior reduction of the parameter space is necessary. In contrast to other methods that use an orthogonal transformation, a PCA allows for an inverse transformation of the data back into the initial parameter space. Therefore, PCA results can directly be interpreted and used for follow-up analyses. These characteristics are fundamental in the statistical analysis of metabolic measurements derived from IMS breath sampling. Westhoff <italic>et al.</italic> applied a PCA for the detection of distinctive metabolites that separated breath samples taken from COPD patients from those of healthy controls [<xref ref-type="bibr" rid="B65-metabolites-02-00733">65</xref>]. The authors identified a single discriminative analyte (cyclohexanone, CAS 108-94-1) out of 104 initially detected VOCs that classified the datasets with a sensitivity of 60%, a specificity of 91%, and a positive predictive value of 95%. Note that further studies still have to validate this analyte as a COPD indicator. In a related study, Westhoff <italic>et al.</italic> embedded PCA into a comprehensive statistical analysis of IMS breath samples taken from 95 COPD patients and 35 healthy individuals including Mann-Whitney U test, correlation analysis and decision trees [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>]. Cheung <italic>et al.</italic> applied PCA to Py-GC-DMS data sets of two strains of <italic>B. subtilis</italic> and one strain of <italic>B. 
megaterium</italic> [<xref ref-type="bibr" rid="B67-metabolites-02-00733">67</xref>]. PCA proved to be sufficient to discriminate bacterial strains on species level, while separation of the two <italic>B. subtilis</italic> strains required chemometric methods using supervised classification. Additionally, the PCA algorithm results in a multidimensional scaling of the original data by using the first two or three principal components. This can be visualized by various software tools or packages for the statistical environment R [<xref ref-type="bibr" rid="B68-metabolites-02-00733">68</xref>]. </p>
      </sec>
    </sec>
    <sec id="sec4-metabolites-02-00733">
      <title>4. Statistical Learning</title>
      <sec>
        <title>4.1. Reduced Ion Mobility Prediction</title>
        <p>Initially, the ion mobility spectrometry method has been used to detect specific target analytes with known reduced ion mobility K<sub>0</sub>. This changed during the shift of application areas from military towards medical and process control purposes resulting in the analysis of complex mixtures in rather humid environment. Therefore, an accurate database of relevant analytes and their specific positions (K<sub>0</sub>, retention time) for automated identification of the peaks within an IMS chromatogram is needed. To create such a database either each reference substance has to be measured by the IMS or parallel measurements with other mass spectrometric methods have to be carried out. However, to create a reference database solely on the basis of these methods is time consuming and expensive. Therefore, computational methods for reduced ion mobility prediction have been developed. </p>
        <p>An early review by Revercomb and Mason describes the fundamental theory of ion mobility (K) on a molecular scale [<xref ref-type="bibr" rid="B69-metabolites-02-00733">69</xref>]. According to this theory, K can be calculated using several factors: charge of the ion, number density of the drift gas, the Boltzmann constant, temperature, ion mass, mass of the drift gas, and the ion collision cross section. Considering constant operating conditions and only singly charged positive molecular ions, K as well as K<sub>0</sub> is only dependent on ion mass and collision cross section. For homologous series of compounds the correlations between ion mobility and ion mass are fairly accurate, which was demonstrated by studies on ketones and amines in the late seventies [<xref ref-type="bibr" rid="B70-metabolites-02-00733">70</xref>,<xref ref-type="bibr" rid="B71-metabolites-02-00733">71</xref>]. </p>
        <p>The first attempts to predict K<sub>0</sub> for non-homologous compounds incorporated structural descriptors in addition to the mass, to encode the elusive collision cross section of the fundamental ion mobility theory. Quantitative structure-property relationship methods, namely multiple linear regression and computational neural networks in combination with numeric structural features were utilized to predict the mobility. The set of features consisted of topological, geometric, electrostatic, and combinations of the three types of molecule attributes.</p>
        <p>The validation on a test-set resulted in a root mean square error of around 0.04 [<xref ref-type="bibr" rid="B72-metabolites-02-00733">72</xref>]. A similar set of functional descriptors was used in 2007 in combination with a multiple linear regression for feature selection and a projection pursuit regression for prediction [<xref ref-type="bibr" rid="B73-metabolites-02-00733">73</xref>].</p>
        <p>A more recent approach utilized the information of the number of carbon atoms within the molecule, to predict the reduced ion mobility of polar aliphatic organic compounds. In this study they discovered a linear relation between the number of carbon atoms and the reduced ion mobility of the compounds within a certain homologous series, as a fast and intuitive method for K<sub>0</sub> estimation [<xref ref-type="bibr" rid="B74-metabolites-02-00733">74</xref>].</p>
      </sec>
      <sec>
        <title>4.2. Probabilistic Relational Learning</title>
        <p>Probabilistic relational learning (PRL) is a very active field in research at the intersection of machine learning, logic, and probability theory. Relational models are the most common representation of structured data. Most statistical learning methods work with “flat” data representations, including objects and their attributes. In contrast to this, probabilistic relational models allow the properties of objects to depend probabilistically on each other and on the properties of other related objects. Data such as enterprise business information, marketing and sales data and medical records can be explicitly modeled as relational models to discover useful relationships and even more importantly, to discover unknown information [<xref ref-type="bibr" rid="B75-metabolites-02-00733">75</xref>]. </p>
        <p>Particularly the identification of biomarkers is one of the major goals in clinical diagnostic research. A biomarker or a set of biomarkers in clinical breath diagnostics is a VOC or a set of VOCs, of which the presence, absence or intensity is an indicator for a certain disease. Therefore statistical relational learning is well suited for analyzing the structure of IMS data and for identifying biomarkers.</p>
        <p>In IMS research, the methodology of probabilistic relational learning was applied in 2011 for the first time by Finthammer <italic>et al.</italic> for biomarker detection and biomedical diagnosis of bronchial carcinoma [<xref ref-type="bibr" rid="B76-metabolites-02-00733">76</xref>]. First, they applied a k-means algorithm for peak clustering in order to identify the molecules detected by the MCC/IMS. Subsequently, they estimated the probability of a peak cluster (PCi) occurring in a measurement and the conditional probability, <italic>i.e.</italic>, the probability for a measurement including a certain peak PCi originating from a patient suffering from bronchial carcinoma. Based on these probabilities, a set of diagnostic rules for bronchial carcinoma was learned by using Inductive Logic Programming [<xref ref-type="bibr" rid="B77-metabolites-02-00733">77</xref>]. The result is a Markov logic network (MLN) defined as a set of (positive or negative) weighted first-order logic formulas together with a set of constants. <xref ref-type="table" rid="metabolites-02-00733-t001">Table 1</xref> shows an example of the resulting diagnostic rules.</p>
        <table-wrap id="metabolites-02-00733-t001" position="float">
          <object-id pub-id-type="pii">metabolites-02-00733-t001_Table 1</object-id>
          <label>Table 1</label>
          <caption>
            <p>Example of MLN formula emerged from Alchemy’s structure learning (90% accuracy), where <italic>pc i (M )</italic> is the presence of peak cluster number <italic>i</italic> in sample <italic>M</italic> and <italic>bc ( M )</italic> indicates that the sample <italic>M</italic> originates from a patient suffering from bronchial carcinoma (<italic>¬bc ( M )</italic> = healthy control) [<xref ref-type="bibr" rid="B76-metabolites-02-00733">76</xref>]. Reproduced with permission from Finthammer <italic>et al.</italic>, International Journal of Ion Mobility Spectrometry published by Springer-Verlag, 2010.</p>
          </caption>
                    <table>
            <thead>
              <tr>
                <th align="left" valign="middle">#</th>
                <th align="left" valign="middle">Formula </th>
                <th align="center" valign="middle">Weight</th>
              </tr>
            </thead>
            <tbody>
              <tr style="border-top: solid thin">
                <td align="left" valign="middle">37</td>
                <td align="right" valign="middle">
                  <italic>pc7(M ) </italic>
                  <italic>⇒ bc ( M )</italic>
                </td>
                <td align="center" valign="middle">4.43</td>
              </tr>
              <tr>
                <td align="left" valign="middle">39</td>
                <td align="right" valign="middle">
                  <italic>pc11 (M ) </italic>
                  <italic>⇒ pc9(M )</italic>
                </td>
                <td align="center" valign="middle">4.82</td>
              </tr>
              <tr>
                <td align="left" valign="middle">44</td>
                <td align="right" valign="middle">
                  <italic>pc17 (M ) </italic>
                  <italic>∧ pc28 (M ) </italic>
                  <italic>⇒ pc21 (M )</italic>
                </td>
                <td align="center" valign="middle">5.05</td>
              </tr>
              <tr>
                <td align="left" valign="middle">46</td>
                <td align="right" valign="middle">
                  <italic>pc15 (M ) </italic>
                  <italic>∧ pc25 (M ) </italic>
                  <italic>⇒ pc5(M )</italic>
                </td>
                <td align="center" valign="middle">−4.30</td>
              </tr>
              <tr>
                <td align="left" valign="middle">47</td>
                <td align="right" valign="middle">
                  <italic>pc17 (M ) </italic>
                  <italic>∧ pc19 (M ) </italic>
                  <italic>∧ pc20 (M ) </italic>
                  <italic>⇒ pc9(M )</italic>
                </td>
                <td align="center" valign="middle">−8.98</td>
              </tr>
              <tr>
                <td align="left" valign="middle">53</td>
                <td align="right" valign="middle">
                  <italic>pc12 (M ) </italic>
                  <italic>∧ pc20 (M ) </italic>
                  <italic>∧ pc22 (M ) </italic>
                  <italic>⇒ pc11 (M )</italic>
                </td>
                <td align="center" valign="middle">−8.14</td>
              </tr>
              <tr>
                <td align="left" valign="middle">57</td>
                <td align="right" valign="middle">
                  <italic>¬pc1(M ) </italic>
                  <italic>∧¬pc18 (M ) </italic>
                  <italic>∧¬pc23 (M ) </italic>
                  <italic>∧ pc31 (M ) </italic>
                  <italic>⇒ bc ( M )</italic>
                </td>
                <td align="center" valign="middle">6.38</td>
              </tr>
              <tr>
                <td align="left" valign="middle">61</td>
                <td align="right" valign="middle">
                  <italic>¬pc10 (M ) </italic>
                  <italic>∧ pc14 (M ) </italic>
                  <italic>∧¬pc18 (M ) </italic>
                  <italic>∧ pc21 (M ) </italic>
                  <italic>⇒ bc ( M )</italic>
                </td>
                <td align="center" valign="middle">7.15</td>
              </tr>
              <tr>
                <td align="left" valign="middle">62</td>
                <td align="right" valign="middle">
                  <italic>¬pc12 (M ) </italic>
                  <italic>∧¬pc22 (M ) </italic>
                  <italic>∧¬pc30 (M ) </italic>
                  <italic>∧ pc31 (M ) </italic>
                  <italic>⇒ bc ( M )</italic>
                </td>
                <td align="center" valign="middle">7.49</td>
              </tr>
              <tr>
                <td align="left" valign="middle">66</td>
                <td align="right" valign="middle">
                  <italic>pc4(M ) </italic>
                  <italic>∧ pc26 (M ) </italic>
                  <italic>∧ pc28 (M ) </italic>
                  <italic>∧ pc29 (M ) </italic>
                  <italic>⇒ bc ( M )</italic>
                </td>
                <td align="center" valign="middle">−5.62</td>
              </tr>
              <tr>
                <td align="left" valign="middle">68</td>
                <td align="right" valign="middle">
                  <italic>¬pc9(M ) </italic>
                  <italic>∧¬pc13 (M ) </italic>
                  <italic>∧¬pc16 (M ) </italic>
                  <italic>∧ pc23 (M ) </italic>
                  <italic>∧¬pc29 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">4.01</td>
              </tr>
              <tr>
                <td align="left" valign="middle">70</td>
                <td align="right" valign="middle">
                  <italic>pc1(M ) </italic>
                  <italic>∧ pc3(M ) </italic>
                  <italic>∧¬pc15 (M ) </italic>
                  <italic>∧¬pc23 (M ) </italic>
                  <italic>∧ pc26 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">−5.18</td>
              </tr>
              <tr>
                <td align="left" valign="middle">72</td>
                <td align="right" valign="middle">
                  <italic>pc0(M ) </italic>
                  <italic>∧¬pc11 (M ) </italic>
                  <italic>∧¬pc12 (M ) </italic>
                  <italic>∧¬pc21 (M ) </italic>
                  <italic>∧ pc22 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">2.45</td>
              </tr>
              <tr>
                <td align="left" valign="middle">75</td>
                <td align="right" valign="middle">
                  <italic>pc5(M ) </italic>
                  <italic>∧ pc7(M ) </italic>
                  <italic>∧¬pc28 (M ) </italic>
                  <italic>∧¬pc29 (M ) </italic>
                  <italic>∧ pc31 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">−2.78</td>
              </tr>
              <tr>
                <td align="left" valign="middle">80</td>
                <td align="right" valign="middle">
                  <italic>pc0(M ) </italic>
                  <italic>∧¬pc12 (M ) </italic>
                  <italic>∧¬pc16 (M ) </italic>
                  <italic>∧ pc30 (M ) </italic>
                  <italic>∧¬pc32 (M ) </italic>
                  <italic>⇒ bc ( M )</italic>
                </td>
                <td align="center" valign="middle">−5.55</td>
              </tr>
              <tr>
                <td align="left" valign="middle">81</td>
                <td align="right" valign="middle">
                  <italic>¬pc6(M ) </italic>
                  <italic>∧¬pc13 (M ) </italic>
                  <italic>∧¬pc28 (M ) </italic>
                  <italic>∧ pc31 (M ) </italic>
                  <italic>∧ pc32 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">5.61</td>
              </tr>
              <tr>
                <td align="left" valign="middle">82</td>
                <td align="right" valign="middle">
                  <italic>¬pc3(M ) </italic>
                  <italic>∧¬pc4(M ) </italic>
                  <italic>∧ pc25 (M ) </italic>
                  <italic>∧¬pc28 (M ) </italic>
                  <italic>∧¬pc32 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">8.77</td>
              </tr>
              <tr>
                <td align="left" valign="middle">89</td>
                <td align="right" valign="middle">
                  <italic>¬pc3(M ) </italic>
                  <italic>∧¬pc11 (M ) </italic>
                  <italic>∧ pc13 (M ) </italic>
                  <italic>∧¬pc17 (M ) </italic>
                  <italic>∧¬pc31 (M ) </italic>
                  <italic>⇒ ¬bc ( M )</italic>
                </td>
                <td align="center" valign="middle">−5.15</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>The best model in this study was based on the rules shown in <xref ref-type="table" rid="metabolites-02-00733-t001">Table 1</xref>. Estimating the influence of connected peaks regarding the health state achieved a cross validation accuracy of up to 90%. However, MLN learning aims at extracting relational, intelligible information from the observed data, which can hardly be measured by statistical parameters. Nevertheless, although PRL allows drawing some conclusions about the relationship between the occurrence of peak clusters and bronchial carcinoma, the authors emphasize that MLNs have certain shortcomings. From the knowledge representation point of view, the weights of an MLN formula have no clear probabilistic semantics and hence only “simple” MLNs are interpretable [<xref ref-type="bibr" rid="B76-metabolites-02-00733">76</xref>].</p>
      </sec>
      <sec>
        <title>4.3. Statistical Learning and Biomarkers</title>
        <p>The general aim of statistical learning is to use the information on the attributes of the samples, encoded in variables or features to infer a certain class. The most common application area of learning methods in bioinformatics is disease prediction. The physician gathers information on both patients suffering from a certain disease and a set of healthy controls. This information is extracted by using different diagnostic techniques, e.g. analyzing blood, urine or breath of the patients, and subsequently used to train computational models.</p>
        <p>The first study using statistical learning approaches on a set of IMS chromatograms to predict the health status of patients was done by Baumbach <italic>et al.</italic> in 2007 [<xref ref-type="bibr" rid="B78-metabolites-02-00733">78</xref>]. They developed a software architecture that analyzed the data of lung cancer patients and healthy persons. Due to a lack of advanced pre-processing and peak location methods, they applied a Gaussian filter to reduce the effect of background noise. The complexity of the model was reduced by decreasing the number of features; the relevant part of each chromatogram (right of the RIP) was separated by a grid, while each feature was calculated as the average intensity of the corresponding grid element. Subsequently, a set of techniques, namely naive Bayes, multi-layer perceptron, and support vector machine (SVM) were applied to achieve an outstanding performance (accuracy and AUC both 99%) distinguishing between the healthy and the diseased [<xref ref-type="bibr" rid="B78-metabolites-02-00733">78</xref>]. Despite the good results, one has to consider that (1) the prediction was done on a comparatively large feature set and a small sample size (35 lung cancer patients and 72 healthy controls), and (2) the accuracy and AUC were evaluated on the training set.</p>
        <p>The next study was carried out only recently in 2011 by Westhoff <italic>et al.</italic> [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>]. This study incorporated the advanced pre-processing and peak location methods described in <xref ref-type="sec" rid="sec2dot3-metabolites-02-00733">Section 2.3</xref> to extract those positions in the chromatogram that correspond to volatile organic compounds. They utilized Mann-Whitney U tests and a decision tree to classify the measurements of 95 COPD patients and 35 healthy controls. Similar to the previous study, the models were trained on the whole set resulting in a very good performance (accuracy 95%). Additionally, Westhoff <italic>et al.</italic> extracted the most interesting molecules either having the lowest p-values by Mann-Whitney U test or chosen as variables in the decision tree [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>].</p>
        <p>Another, more recent study by Hauschild <italic>et al.</italic> in 2012 focused on the classification and biomarker identification of COPD and bronchial carcinoma based on MCC/IMS data. The data set was composed of 35 healthy controls (HC) and 84 patients either suffering from chronic obstructive pulmonary disease (COPD) or both COPD and bronchial carcinoma (COPD+BC). Like the study of Westhoff <italic>et al.</italic> [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>], the advanced pre-processing and peak location methods provided by the VisualNow software were used to build the features for COPD and bronchial carcinoma prediction. To get a broad overview of the potential of the data and the different classification techniques, six different sophisticated statistical learning methods were applied: decision trees, naive Bayes, neural networks, random forest and linear as well as radial SVM [<xref ref-type="bibr" rid="B79-metabolites-02-00733">79</xref>]. Similar to the previous studies of Baumbach <italic>et al.</italic> [<xref ref-type="bibr" rid="B78-metabolites-02-00733">78</xref>] and Westhoff <italic>et al.</italic> [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>], the set of samples was small (119 volunteers), which leads to a very noisy estimation of the predictive performance. Therefore, in contrast to the previous studies, the authors used cross validation to provide an accurate estimate for the actual performance of the predictive model. The random forest was reported to produce the best prediction results for the COPD prediction (accuracy 94%, AUC 92%) and the bronchial carcinoma prediction (accuracy 79%). Due to the low performance, the authors suggest that further analysis of the separation between COPD and bronchial carcinoma patients is needed.
In fact, all tested methods showed a very low sensitivity for the COPD class in contrast to a high sensitivity for the BC class, which indicates that the differentiation between class COPD and COPD + BC is difficult. Indeed, most of the measurements of COPD patients were falsely predicted as suffering from both COPD and bronchial carcinoma, which might be attributable to the characteristic of COPD as a common and important independent risk factor for lung cancer. Both studies, Westhoff <italic>et al.</italic> 2011 [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>] as well as Hauschild <italic>et al.</italic> [<xref ref-type="bibr" rid="B79-metabolites-02-00733">79</xref>], each identified a set of the ten most informative features; five of these twenty features overlapped in both the inverse drift time and the retention time, which means they represent the same VOCs.</p>
        <table-wrap id="metabolites-02-00733-t002" position="float">
          <object-id pub-id-type="pii">metabolites-02-00733-t002_Table 2</object-id>
          <label>Table 2</label>
          <caption>
            <p>An overview of the four studies in <xref ref-type="sec" rid="sec4-metabolites-02-00733">Section 4</xref>, analyzing MCC/IMS data of different diseases (bronchial carcinoma (BC) and chronic obstructive pulmonary disease (COPD)). The ACC is the accuracy given by the percentage of correctly classified samples, # is the number of samples in that study, the AUC is the area under the receiver operating characteristics (ROC) curve, and CV indicates whether cross validation was used.</p>
          </caption>
          <table>
            <thead>
              <tr>
                <th align="left" valign="middle">Study</th>
                <th align="left" valign="middle">Disease</th>
                <th align="left" valign="middle">#</th>
                <th align="left" valign="middle">ACC</th>
                <th align="left" valign="middle">AUC</th>
                <th align="left" valign="middle">CV</th>
              </tr>
            </thead>
            <tbody>
              <tr>
                <td align="left" valign="middle">Finthammer <italic>et al.</italic> 2010 [<xref ref-type="bibr" rid="B76-metabolites-02-00733">76</xref>]</td>
                <td align="left" valign="middle">BC</td>
                <td align="left" valign="middle">158</td>
                <td align="left" valign="middle">90%</td>
                <td align="left" valign="middle">-</td>
                <td align="left" valign="middle">√</td>
              </tr>
              <tr>
                <td align="left" valign="middle">Baumbach <italic>et al.</italic> 2007 [<xref ref-type="bibr" rid="B78-metabolites-02-00733">78</xref>]</td>
                <td align="left" valign="middle">BC</td>
                <td align="left" valign="middle">107</td>
                <td align="left" valign="middle">99%</td>
                <td align="left" valign="middle">99%</td>
                <td align="left" valign="middle">-</td>
              </tr>
              <tr>
                <td align="left" valign="middle">Westhoff <italic>et al.</italic> 2011 [<xref ref-type="bibr" rid="B66-metabolites-02-00733">66</xref>]</td>
                <td align="left" valign="middle">COPD</td>
                <td align="left" valign="middle">130</td>
                <td align="left" valign="middle">94%</td>
                <td align="left" valign="middle">-</td>
                <td align="left" valign="middle">-</td>
              </tr>
              <tr>
                <td align="left" valign="middle">Hauschild <italic>et al.</italic> 2012 [<xref ref-type="bibr" rid="B79-metabolites-02-00733">79</xref>]</td>
                <td align="left" valign="middle">COPD and BC</td>
                <td align="left" valign="middle">119</td>
                <td align="left" valign="middle">94%</td>
                <td align="left" valign="middle">92%</td>
                <td align="left" valign="middle">√</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec>
      <title>5. Summary and Conclusion</title>
      <p>We conclude that MCC/IMS coupled with sophisticated computational methods has the potential to successfully address a broad range of biomedical questions. The investigation of a rather large number of volatile metabolites, especially in breath, opens the way for a totally non-invasive method of investigation with respect to systems biology and personalized medicine. Based on the chemical analysis of some mL of volatiles, time series and continuous investigations of cells, organs, animals and humans could be realized. Such continuous sampling is rather complicated using techniques that require the invasive collection of blood or other material. On the instrumental side, detection limits down to the pg/L-range (ppt<sub>v</sub>-range) are achieved in a rather humid and complex environment. On the data analysis side, many problems on the way to a comprehensive framework for the analysis of MCC/IMS chromatograms have been solved, for example, the definition of the data format, the visualization and the general evaluation using statistical techniques. Nevertheless, some computational challenges remain (<xref ref-type="table" rid="metabolites-02-00733-t003">Table 3</xref>).</p>
      
      <p>One of the main tasks is to develop a flexible and comprehensive centralized data repository, which is still unsolved. In contrast to this, pre-processing methods like RIP detailing, smoothing and de-noising have been studied extensively in the last five to ten years. However, the assessment of the quality of these techniques has been done solely by visual appearance. The same holds for the results of the peak detection methods, which were evaluated, if at all, using visual comparison with the manually selected peak lists. Besides, the question of when a peak is recognized as a peak is still open and varies from operator to operator. In the future, pre-processing and peak picking methods have to be validated and compared according to the aim of the study, <italic>i.e.</italic>, the classification performance.</p>
      <table-wrap id="metabolites-02-00733-t003" position="float">
        <object-id pub-id-type="pii">metabolites-02-00733-t003_Table 3</object-id>
        <label>Table 3</label>
        <caption>
          <p>This table shows the ranking of the achievements in MCC/IMS data analysis using computational methods.</p>
        </caption>
        <table>
          <thead>
            <tr>
              <th align="left" valign="middle">Computational requirements</th>
              <th align="center" valign="middle">Completed</th>
            </tr>
          </thead>
          <tbody>
            <tr>
              <td align="left" valign="middle">Data format</td>
              <td align="center" valign="middle">***</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Visualization</td>
              <td align="center" valign="middle">***</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Pre-processing methods</td>
              <td align="center" valign="middle">**</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Peak detection methods</td>
              <td align="center" valign="middle">**</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Centralized data repository</td>
              <td align="center" valign="middle">*</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Statistical approaches</td>
              <td align="center" valign="middle">***</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Statistical learning methods</td>
              <td align="center" valign="middle">*</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Differentiation of diseases, infections, cancer, etc.</td>
              <td align="center" valign="middle">*</td>
            </tr>
            <tr>
              <td align="left" valign="middle">Disease pathway identification</td>
              <td align="center" valign="middle">-</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
        <fn>
        <p>“***” accomplished; “**” almost complete; “*” first steps have been made; “-” not solved</p>
        </fn>
        </table-wrap-foot>
      </table-wrap>
      
      <p>The next steps in the framework would be biomarker identification and disease classification using statistical methods like Mann-Whitney U tests and more sophisticated learning methods. In contrast to the statistical analysis methods, statistical learning methods train models that are able to predict the class of samples using a set of features found to be most informative for this model. So far, the statistical learning methods applied to MCC/IMS data concentrated solely on supervised methods. However, unsupervised learning methods in general have a great potential of extracting additional information from the data, which has not been shown so far in the present field of interest. Unsupervised clustering methods can find groups of molecules or samples without any information on the classes (healthy vs. disease). Therefore, such methods are to be applied on large datasets generated in multicenter studies in different hospitals and should show their potential with respect to specific and unspecific metabolic questions in the future. To complete the framework, an automated analysis of the IMS data, starting with a centralized database, followed by an automated biomarker identification and classification, is needed, which is generally open for different instrumentations and metabolic questions.</p>
      <p>Such a centralized and flexible storage, which is capable of gathering all kinds of confounding factors, diet or medication, for instance, allows for the discovery of their influence within the IMS chromatograms and hence a more accurate disease modeling accounting for these contaminations. One question has been left untouched so far: “How to find the disease-specific pathway?” Once the most interesting analytes considered as potential biomarkers are detected, the identity of these molecules is determined by mass spectrometric methods. Subsequently, the pathways within the human or bacterial organisms containing these potential biomarkers can be further investigated by novel computational techniques. In a recent review by Khatri <italic>et al.</italic>, these techniques for pathway analysis have been categorized into three generations of approaches: the first-generation "over-representation analysis" (ORA) approaches, the second-generation "functional class scoring" (FCS) approaches, and the third-generation "pathway topology" (PT) approaches [<xref ref-type="bibr" rid="B80-metabolites-02-00733">80</xref>].</p>
      <p>We conclude that the basic computational methods for pre-processing, biomarker identification and disease prediction are available. However, a comprehensive framework providing a pipeline to automatically pre-process and evaluate complete sets of MCC/IMS data is still required.</p>
    </sec>
    
  </body>
  <back>
  <ack>
      <title>Acknowledgments</title>
      <p>The financial support of the Ministry of Education, Science and Technology (MEST) of the Republic of Korea is gratefully acknowledged. Part of the work of this paper has been supported by the Deutsche Forschungsgemeinschaft (DFG) within the Collaborative Research Center (Sonderforschungsbereich) SFB 876 “Providing Information by Resource-Constrained Analysis”, project TB1 “Resource-Constrained Analysis of Spectrometry Data”.</p>
      <p>In addition, the work was supported partly by the German Federal Ministry of Economics and Technology based on a decision of the Deutscher Bundestag within the project KF2368102AKO.</p>
    </ack>
    <notes>
      <title>Conflict of Interest</title>
      <p>The authors declare no conflict of interest.</p>
    </notes>
    <ref-list>
      <title>References</title>
      <ref id="B1-metabolites-02-00733">
        <label>1.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ligor</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Ligor</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Amann</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Ager</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Bachler</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Dzien</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Buszewski</surname>
              <given-names>B.</given-names>
            </name>
          </person-group>
          <article-title>The analysis of healthy volunteers' exhaled breath by the use of solid-phase microextraction and GC-MS</article-title>
          <source>J. Breath Res.</source>
          <year>2008</year>
          <volume>2</volume>
          <fpage>046006:1</fpage>
          <lpage>046006:8</lpage>
        </citation>
      </ref>
      <ref id="B2-metabolites-02-00733">
        <label>2.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jünger</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Peak assignment in multi-capillary column - ion mobility spectrometry using comparative studies with gas chromatography-mass spectrometry for exhaled breath analysis</article-title>
          <source>Anal. Bioanal. Chem.</source>
          <year>2010</year>
          <volume>396</volume>
          <fpage>471</fpage>
          <lpage>482</lpage>
          <pub-id pub-id-type="doi">10.1007/s00216-009-3168-z</pub-id>
        </citation>
      </ref>
      <ref id="B3-metabolites-02-00733">
        <label>3.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mieth</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Schubert</surname>
              <given-names>J.K.</given-names>
            </name>
            <name>
              <surname>Groger</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Sabel</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Kischkel</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Fuchs</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Hein</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Zimmermann</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Miekisch</surname>
              <given-names>W.</given-names>
            </name>
          </person-group>
          <article-title>Automated Needle Trap Heart-Cut GC/MS and Needle Trap Comprehensive Two-Dimensional GC/TOF-MS for Breath Gas Analysis in the Clinical Environment</article-title>
          <source>Anal. Chem.</source>
          <year>2010</year>
          <volume>82</volume>
          <fpage>2541</fpage>
          <lpage>2551</lpage>
        <pub-id pub-id-type="doi">10.1021/ac100061k</pub-id><pub-id pub-id-type="pmid">20170082</pub-id></citation>
      </ref>
      <ref id="B4-metabolites-02-00733">
        <label>4.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kushch</surname>
              <given-names>I.</given-names>
            </name>
            <name>
              <surname>Schwarz</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Schwentner</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Baumann</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Dzien</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Schmid</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Unterkofler</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Gastl</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Spanel</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Smith</surname>
              <given-names>D.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>Compounds enhanced in a mass spectrometric profile of smokers' exhaled breath versus non-smokers as determined in a pilot study using PTR-MS</article-title>
          <source>J. Breath Res.</source>
          <year>2008</year>
          <volume>2</volume>
          <fpage>026002:1</fpage>
          <lpage>026002:26</lpage>
        </citation>
      </ref>
      <ref id="B5-metabolites-02-00733">
        <label>5.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ligor</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Ligor</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Bajtarevic</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Ager</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Pienz</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Klieber</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Denz</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Fiegl</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Hilbe</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Weiss</surname>
              <given-names>W.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>Determination of volatile organic compounds in exhaled breath of patients with lung cancer using solid phase microextraction and gas chromatography mass spectrometry</article-title>
          <source>Clin. Chem. Lab. Med.</source>
          <year>2009</year>
          <volume>47</volume>
          <fpage>550</fpage>
          <lpage>560</lpage>
        <pub-id pub-id-type="pmid">19397483</pub-id></citation>
      </ref>
      <ref id="B6-metabolites-02-00733">
        <label>6.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Buszewski</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Ulanowska</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Ligor</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Denderz</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Amann</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>Analysis of exhaled breath from smokers, passive smokers and non-smokers by solid-phase microextraction gas chromatography/mass spectrometry</article-title>
          <source>Biomed. Chromatogr.</source>
          <year>2009</year>
          <volume>23</volume>
          <fpage>551</fpage>
          <lpage>556</lpage>
          <pub-id pub-id-type="doi">10.1002/bmc.1141</pub-id>
        </citation>
      </ref>
      <ref id="B7-metabolites-02-00733">
        <label>7.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cheng</surname>
              <given-names>Z.J.</given-names>
            </name>
            <name>
              <surname>Warwick</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Yates</surname>
              <given-names>D.H.</given-names>
            </name>
            <name>
              <surname>Thomas</surname>
              <given-names>P.S.</given-names>
            </name>
          </person-group>
          <article-title>An electronic nose in the discrimination of breath from smokers and non-smokers: a model for toxin exposure</article-title>
          <source>J. Breath Res.</source>
          <year>2009</year>
          <volume>3</volume>
          <fpage>036003/036001</fpage>
          <lpage>036003/036005</lpage>
        </citation>
      </ref>
      <ref id="B8-metabolites-02-00733">
        <label>8.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Dragonieri</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Annema</surname>
              <given-names>J.T.</given-names>
            </name>
            <name>
              <surname>Schot</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>van der Schee</surname>
              <given-names>M.P.C.</given-names>
            </name>
            <name>
              <surname>Spanevello</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Carratu</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Resta</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Rabe</surname>
              <given-names>K.F.</given-names>
            </name>
            <name>
              <surname>Sterk</surname>
              <given-names>P.J.</given-names>
            </name>
          </person-group>
          <article-title>An electronic nose in the discrimination of patients with non-small cell lung cancer and COPD</article-title>
          <source>Lung Cancer</source>
          <year>2009</year>
          <volume>64</volume>
          <fpage>166</fpage>
          <lpage>170</lpage>
          <pub-id pub-id-type="doi">10.1016/j.lungcan.2008.08.008</pub-id>
        </citation>
      </ref>
      <ref id="B9-metabolites-02-00733">
        <label>9.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Dragonieri</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Schot</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Mertens</surname>
              <given-names>B.J.A.</given-names>
            </name>
            <name>
              <surname>le Cessie</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Gauw</surname>
              <given-names>S.A.</given-names>
            </name>
            <name>
              <surname>Spanevello</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Resta</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Willard</surname>
              <given-names>N.P.</given-names>
            </name>
            <name>
              <surname>Vink</surname>
              <given-names>T.J.</given-names>
            </name>
            <name>
              <surname>Rabe</surname>
              <given-names>K.F.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>An electronic nose in the discrimination of patients with asthma and controls</article-title>
          <source>J. Allergy Clin. Immun.</source>
          <year>2007</year>
          <volume>120</volume>
          <fpage>856</fpage>
          <lpage>862</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jaci.2007.05.043</pub-id>
        </citation>
      </ref>
      <ref id="B10-metabolites-02-00733">
        <label>10.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Horvath</surname>
              <given-names>I.</given-names>
            </name>
            <name>
              <surname>Lazar</surname>
              <given-names>Z.</given-names>
            </name>
            <name>
              <surname>Gyulai</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Kollai</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Losonczy</surname>
              <given-names>G.</given-names>
            </name>
          </person-group>
          <article-title>Exhaled biomarkers in lung cancer</article-title>
          <source>Eur. Respir. J.</source>
          <year>2009</year>
          <volume>34</volume>
          <fpage>261</fpage>
          <lpage>275</lpage>
          <pub-id pub-id-type="doi">10.1183/09031936.00142508</pub-id>
        </citation>
      </ref>
      <ref id="B11-metabolites-02-00733">
        <label>11.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Beauchamp</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Kirsch</surname>
              <given-names>F.</given-names>
            </name>
            <name>
              <surname>Buettner</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>Real-time breath gas analysis for pharmacokinetics: monitoring exhaled breath by on-line proton-transfer-reaction mass spectrometry after ingestion of eucalyptol-containing capsules</article-title>
          <source>J. Breath Res.</source>
          <year>2010</year>
          <pub-id pub-id-type="doi">10.1088/1752-7155/4/2/026006</pub-id>
        </citation>
      </ref>
      <ref id="B12-metabolites-02-00733">
        <label>12.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Herbig</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Mueller</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Schallhart</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Titzmann</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Graus</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Hansel</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>On-line breath analysis with PTR-TOF</article-title>
          <source>J. Breath Res.</source>
          <year>2009</year>
          <volume>3</volume>
          <fpage>027004:1</fpage>
          <lpage>027004:10</lpage>
        </citation>
      </ref>
      <ref id="B13-metabolites-02-00733">
        <label>13.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Perl</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Jünger</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Nolte</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
          </person-group>
          <article-title>Alignment of retention time obtained from multicapillary column gas chromatography used for VOC analysis with ion mobility spectrometry</article-title>
          <source>Anal. Bioanal. Chem.</source>
          <year>2010</year>
          <volume>397</volume>
          <fpage>2385</fpage>
          <lpage>2394</lpage>
          <pub-id pub-id-type="doi">10.1007/s00216-010-3798-1</pub-id>
        </citation>
      </ref>
      <ref id="B14-metabolites-02-00733">
        <label>14.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Process analysis using ion mobility spectrometry</article-title>
          <source>Anal. Bioanal. Chem.</source>
          <year>2006</year>
          <volume>384</volume>
          <fpage>1059</fpage>
          <lpage>1070</lpage>
          <pub-id pub-id-type="doi">10.1007/s00216-005-3397-8</pub-id>
        </citation>
      </ref>
      <ref id="B15-metabolites-02-00733">
        <label>15.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
            <name>
              <surname>Westhoff</surname>
              <given-names>M.</given-names>
            </name>
          </person-group>
          <article-title>Ion mobility spectrometry to detect lung cancer and airway infections</article-title>
          <source>Spectrosc. Eur.</source>
          <year>2006</year>
          <volume>18</volume>
          <fpage>22</fpage>
          <lpage>27</lpage>
        </citation>
      </ref>
      <ref id="B16-metabolites-02-00733">
        <label>16.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Westhoff</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Litterst</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Freitag</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Ion mobility spectrometry in the diagnosis of Sarcoidosis: Results of a feasibility study</article-title>
          <source>J. Physiol. Pharmacol.</source>
          <year>2007</year>
          <volume>58</volume>
          <fpage>739</fpage>
          <lpage>751</lpage>
          <pub-id pub-id-type="pmid">18204189</pub-id>
        </citation>
      </ref>
      <ref id="B17-metabolites-02-00733">
        <label>17.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Nolte</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Fobbe</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Breath analysis—performance and potential of ion mobility spectrometry</article-title>
          <source>J. Breath Res.</source>
          <year>2009</year>
        </citation>
      </ref>
      <ref id="B18-metabolites-02-00733">
        <label>18.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Basanta</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Koimtzis</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Singh</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Wilson</surname>
              <given-names>I.</given-names>
            </name>
            <name>
              <surname>Thomas</surname>
              <given-names>C.L.P.</given-names>
            </name>
          </person-group>
          <article-title>An adaptive breath sampler for use with human subjects with an impaired respiratory function</article-title>
          <source>Analyst</source>
          <year>2007</year>
          <volume>132</volume>
          <fpage>153</fpage>
          <lpage>163</lpage>
          <pub-id pub-id-type="doi">10.1039/b608608j</pub-id>
        </citation>
      </ref>
      <ref id="B19-metabolites-02-00733">
        <label>19.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Basanta</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Koimtzis</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Thomas</surname>
              <given-names>C.L.P.</given-names>
            </name>
          </person-group>
          <article-title>Sampling and analysis of exhaled breath on human subjects with thermal desorption gas chromatography - differential mobility spectrometry</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2006</year>
          <volume>9</volume>
          <fpage>45</fpage>
          <lpage>49</lpage>
        </citation>
      </ref>
      <ref id="B20-metabolites-02-00733">
        <label>20.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>King</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Kupferthaler</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Frauscher</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Hackner</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Unterkofler</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Teschl</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Hinterhuber</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Amann</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Högl</surname>
              <given-names>B.</given-names>
            </name>
          </person-group>
          <article-title>Measurement of endogenous acetone and isoprene in exhaled breath during sleep</article-title>
          <source>Physiol. Meas.</source>
          <year>2012</year>
          <pub-id pub-id-type="doi">10.1088/0967-3334/33/3/413</pub-id>
        </citation>
      </ref>
      <ref id="B21-metabolites-02-00733">
        <label>21.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lee</surname>
              <given-names>J.H.</given-names>
            </name>
            <name>
              <surname>Hwang</surname>
              <given-names>S.M.</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>D.W.</given-names>
            </name>
            <name>
              <surname>Heo</surname>
              <given-names>G.S.</given-names>
            </name>
          </person-group>
          <article-title>Determination of volatile organic compounds (VOCs) using Tedlar bag/solid-phase microextraction/gas chromatography/mass spectrometry (SPME/GC/MS) in ambient and workplace air</article-title>
          <source>Bull. Korean Chem. Soc.</source>
          <year>2002</year>
          <volume>23</volume>
          <fpage>488</fpage>
          <lpage>496</lpage>
          <pub-id pub-id-type="doi">10.5012/bkcs.2002.23.3.488</pub-id>
        </citation>
      </ref>
      <ref id="B22-metabolites-02-00733">
        <label>22.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Schulz</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Jensen</surname>
              <given-names>M.L.</given-names>
            </name>
            <name>
              <surname>Balsley</surname>
              <given-names>B.B.</given-names>
            </name>
            <name>
              <surname>Davis</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Birks</surname>
              <given-names>J.W.</given-names>
            </name>
          </person-group>
          <article-title>Tedlar bag sampling technique for vertical profiling of carbon dioxide through the atmospheric boundary layer with high precision and accuracy</article-title>
          <source>Environ. Sci. Technol.</source>
          <year>2004</year>
          <volume>38</volume>
          <fpage>3683</fpage>
          <lpage>3688</lpage>
          <pub-id pub-id-type="doi">10.1021/es035046h</pub-id>
        </citation>
      </ref>
      <ref id="B23-metabolites-02-00733">
        <label>23.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Beauchamp</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Herbig</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Gutmann</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Hansel</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>On the use of Tedlar bags for breath-gas sampling and analysis</article-title>
          <source>J. Breath Res.</source>
          <year>2008</year>
          <fpage>046001:1</fpage>
          <lpage>046001:19</lpage>
        </citation>
      </ref>
      <ref id="B24-metabolites-02-00733">
        <label>24.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Filipiak</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Filipiak</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Ager</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Wiesenhofer</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Amann</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>Optimization of sampling parameters for collection and preconcentration of alveolar air by needle traps</article-title>
          <source>J. Breath Res.</source>
          <year>2012</year>
          <volume>6</volume>
          <fpage>027107</fpage>
          <pub-id pub-id-type="doi">10.1088/1752-7155/6/2/027107</pub-id>
        </citation>
      </ref>
      <ref id="B25-metabolites-02-00733">
        <label>25.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bajtarevic</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Ager</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Pienz</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Klieber</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Schwarz</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Ligor</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Ligor</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Filipiak</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Denz</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Fiegl</surname>
              <given-names>M.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>Noninvasive detection of lung cancer by analysis of exhaled breath</article-title>
          <source>BMC Cancer</source>
          <year>2009</year>
          <pub-id pub-id-type="doi">10.1186/1471-2407-9-348</pub-id>
        </citation>
      </ref>
      <ref id="B26-metabolites-02-00733">
        <label>26.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Miekisch</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Hengstenberg</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Kischkel</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Beckmann</surname>
              <given-names>U.</given-names>
            </name>
            <name>
              <surname>Mieth</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Schubert</surname>
              <given-names>J.K.</given-names>
            </name>
          </person-group>
          <article-title>Construction and Evaluation of a Versatile CO2 Controlled Breath Collection Device</article-title>
          <source>IEEE Sens. J.</source>
          <year>2010</year>
          <volume>10</volume>
          <fpage>211</fpage>
          <lpage>215</lpage>
          <pub-id pub-id-type="doi">10.1109/JSEN.2009.2035757</pub-id>
        </citation>
      </ref>
      <ref id="B27-metabolites-02-00733">
        <label>27.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
            <name>
              <surname>Eiceman</surname>
              <given-names>G.A.</given-names>
            </name>
          </person-group>
          <article-title>Ion Mobility Spectrometry: Arriving On Site and Moving Beyond a Low Profile</article-title>
          <source>Appl. Spectrosc.</source>
          <year>1999</year>
          <volume>53</volume>
          <fpage>338A</fpage>
          <lpage>355A</lpage>
          <pub-id pub-id-type="doi">10.1366/0003702991947847</pub-id>
        </citation>
      </ref>
      <ref id="B28-metabolites-02-00733">
        <label>28.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hill</surname>
              <given-names>H.H.</given-names>
              <suffix>Jr.</suffix>
            </name>
            <name>
              <surname>Siems</surname>
              <given-names>W.F.</given-names>
            </name>
            <name>
              <surname>St Louis</surname>
              <given-names>R.H.</given-names>
            </name>
            <name>
              <surname>McMinn</surname>
              <given-names>D.G.</given-names>
            </name>
          </person-group>
          <article-title>Ion mobility spectrometry</article-title>
          <source>Anal. Chem.</source>
          <year>1990</year>
          <volume>62</volume>
          <fpage>1201A</fpage>
          <lpage>1209A</lpage>
          <pub-id pub-id-type="pmid">2288410</pub-id>
        </citation>
      </ref>
      <ref id="B29-metabolites-02-00733">
        <label>29.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ruzsanyi</surname>
              <given-names>V.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
            <name>
              <surname>Sielemann</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Litterst</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Westhoff</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Freitag</surname>
              <given-names>L.</given-names>
            </name>
          </person-group>
          <article-title>Detection of human metabolites using multi-capillary columns coupled to ion mobility spectrometers</article-title>
          <source>J. Chromatogr. A</source>
          <year>2005</year>
          <volume>1084</volume>
          <fpage>145</fpage>
          <lpage>151</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chroma.2005.01.055</pub-id>
        </citation>
      </ref>
      <ref id="B30-metabolites-02-00733">
        <label>30.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Ion Mobility Spectrometry coupled with Multi-Capillary Columns for Metabolic Profiling of Human Breath</article-title>
          <source>J. Breath Res.</source>
          <year>2009</year>
          <volume>3</volume>
          <fpage>1</fpage>
          <lpage>16</lpage>
        </citation>
      </ref>
      <ref id="B31-metabolites-02-00733">
        <label>31.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Blank</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Schmid</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Detection of volatile metabolites of Escherichia coli by multi capillary column coupled ion mobility spectrometry</article-title>
          <source>Anal. Bioanal. Chem.</source>
          <year>2009</year>
          <volume>394</volume>
          <fpage>791</fpage>
          <lpage>800</lpage>
          <pub-id pub-id-type="doi">10.1007/s00216-009-2758-0</pub-id>
        </citation>
      </ref>
      <ref id="B32-metabolites-02-00733">
        <label>32.</label>
        <citation citation-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Eiceman</surname>
              <given-names>G.A.</given-names>
            </name>
            <name>
              <surname>Karpas</surname>
              <given-names>Z.</given-names>
            </name>
          </person-group>
          <source>Ion Mobility Spectrometry</source>
          <edition>2nd</edition>
          <publisher-name>CRC Press, Taylor &amp; Francis</publisher-name>
          <publisher-loc>Boca Raton, FL, USA</publisher-loc>
          <year>2005</year>
          <volume>1</volume>
          <fpage>337</fpage>
        </citation>
      </ref>
      <ref id="B33-metabolites-02-00733">
        <label>33.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Bader</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Recommendation of a standard format for data sets from GC/IMS with sensor-controlled sampling</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2008</year>
          <volume>11</volume>
          <fpage>71</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-008-0010-9</pub-id>
        </citation>
      </ref>
      <ref id="B34-metabolites-02-00733">
        <label>34.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Rupp</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Recommendation for an upgrade to the standard format in order to cross-link the GC/MSD and the MCC/IMS data</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2012</year>
          <volume>15</volume>
          <fpage>79</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-012-0089-x</pub-id>
        </citation>
      </ref>
      <ref id="B35-metabolites-02-00733">
        <label>35.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bunkowski</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>Software tool for coupling chromatographic total ion current dependencies of GC/MSD and MCC/IMS</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2010</year>
          <volume>13</volume>
          <fpage>169</fpage>
          <lpage>175</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-010-0045-6</pub-id>
        </citation>
      </ref>
      <ref id="B36-metabolites-02-00733">
        <label>36.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Visualisation of MCC/IMS—Data</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2008</year>
          <volume>11</volume>
          <fpage>77</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-008-0011-8</pub-id>
        </citation>
      </ref>
      <ref id="B37-metabolites-02-00733">
        <label>37.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Borsdorf</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Eiceman</surname>
              <given-names>G.A.</given-names>
            </name>
          </person-group>
          <article-title>Ion Mobility Spectrometry: Principles and Applications</article-title>
          <source>Appl. Spectrosc. Rev.</source>
          <year>2006</year>
          <volume>41</volume>
          <fpage>323</fpage>
          <lpage>375</lpage>
          <pub-id pub-id-type="doi">10.1080/05704920600663469</pub-id>
        </citation>
      </ref>
      <ref id="B38-metabolites-02-00733">
        <label>38.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cumeras</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Schneider</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Favrod</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Figueras</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Gracia</surname>
              <given-names>I.</given-names>
            </name>
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Stability and alignment of MCC/IMS devices</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2012</year>
          <volume>15</volume>
          <fpage>41</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-012-0088-y</pub-id>
        </citation>
      </ref>
      <ref id="B39-metabolites-02-00733">
        <label>39.</label>
        <citation citation-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Bader</surname>
              <given-names>S.</given-names>
            </name>
          </person-group>
          <source>Identification and Quantification of Peaks in Spectrometric Data</source>
          <publisher-name>Technical University of Dortmund</publisher-name>
          <publisher-loc>Dortmund, Germany</publisher-loc>
          <year>2008</year>
        </citation>
      </ref>
      <ref id="B40-metabolites-02-00733">
        <label>40.</label>
        <citation citation-type="thesis">
          <person-group person-group-type="author">
            <name>
              <surname>Bunkowski</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>MCC-IMS data analysis using automated spectra processing and explorative visualization methods</article-title>
          <comment>PhD thesis, University Bielefeld: Bielefeld, Germany, 2011.</comment>
        </citation>
      </ref>
      <ref id="B41-metabolites-02-00733">
        <label>41.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bader</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Urfer</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Preprocessing of Ion Mobility Spectra by Lognormal Detailing and Wavelet Transform</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2008</year>
          <volume>11</volume>
          <fpage>43</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-008-0005-6</pub-id>
        </citation>
      </ref>
      <ref id="B42-metabolites-02-00733">
        <label>42.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Urbas</surname>
              <given-names>A.A.</given-names>
            </name>
            <name>
              <surname>Harrington</surname>
              <given-names>P.B.</given-names>
            </name>
          </person-group>
          <article-title>Two-dimensional wavelet compression of ion mobility spectra</article-title>
          <source>Anal. Chim. Acta</source>
          <year>2001</year>
          <volume>446</volume>
          <fpage>393</fpage>
          <lpage>412</lpage>
        </citation>
      </ref>
      <ref id="B43-metabolites-02-00733">
        <label>43.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cai</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Harrington</surname>
              <given-names>P.B.</given-names>
            </name>
          </person-group>
          <article-title>Different Discrete Wavelet Transforms Applied to Denoising Analytical Data</article-title>
          <source>J. Chem. Inf. Comp. Sci.</source>
          <year>1998</year>
          <volume>38</volume>
          <fpage>1161</fpage>
          <lpage>1170</lpage>
          <pub-id pub-id-type="doi">10.1021/ci980210j</pub-id>
        </citation>
      </ref>
      <ref id="B44-metabolites-02-00733">
        <label>44.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Savitzky</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Golay</surname>
              <given-names>M.J.E.</given-names>
            </name>
          </person-group>
          <article-title>Smoothing and Differentiation of Data by Simplified Least Squares Procedures</article-title>
          <source>Anal. Chem.</source>
          <year>1964</year>
          <volume>36</volume>
          <fpage>1627</fpage>
          <lpage>1639</lpage>
          <pub-id pub-id-type="doi">10.1021/ac60214a047</pub-id>
        </citation>
      </ref>
      <ref id="B45-metabolites-02-00733">
        <label>45.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Haddad</surname>
              <given-names>R.A.</given-names>
            </name>
            <name>
              <surname>Akansu</surname>
              <given-names>A.N.</given-names>
            </name>
          </person-group>
          <article-title>A class of fast Gaussian binomial filters for speech and image-processing</article-title>
          <source>IEEE T. Signal Proces.</source>
          <year>1991</year>
          <volume>39</volume>
          <fpage>723</fpage>
          <lpage>727</lpage>
          <pub-id pub-id-type="doi">10.1109/78.80892</pub-id>
        </citation>
      </ref>
      <ref id="B46-metabolites-02-00733">
        <label>46.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cleveland</surname>
              <given-names>W.S.</given-names>
            </name>
          </person-group>
          <article-title>Robust locally weighted regression and smoothing scatterplots</article-title>
          <source>J. Am. Stat. Assoc.</source>
          <year>1979</year>
          <volume>74</volume>
          <fpage>829</fpage>
          <lpage>836</lpage>
          <pub-id pub-id-type="doi">10.1080/01621459.1979.10481038</pub-id>
        </citation>
      </ref>
      <ref id="B47-metabolites-02-00733">
        <label>47.</label>
        <citation citation-type="confproc">
          <person-group person-group-type="author">
            <name>
              <surname>Bruce</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Balch</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Veloso</surname>
              <given-names>M.</given-names>
            </name>
          </person-group>
          <article-title>Fast and inexpensive color image segmentation for interactive robots</article-title>
          <source>Proceedings of the 2000 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS 2000)</source>
          <conf-loc>Takamatsu, Japan</conf-loc>
          <conf-date>31 Oct–05 Nov</conf-date>
          <year>2000</year>
        </citation>
      </ref>
      <ref id="B48-metabolites-02-00733">
        <label>48.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Randolph</surname>
              <given-names>T.W.</given-names>
            </name>
            <name>
              <surname>Yasui</surname>
              <given-names>Y.</given-names>
            </name>
          </person-group>
          <article-title>Multiscale processing of mass spectrometry data</article-title>
          <source>Biometrics</source>
          <year>2006</year>
          <volume>62</volume>
          <fpage>589</fpage>
          <lpage>597</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1541-0420.2005.00504.x</pub-id>
        </citation>
      </ref>
      <ref id="B49-metabolites-02-00733">
        <label>49.</label>
        <citation citation-type="confproc">
          <person-group person-group-type="author">
            <name>
              <surname>Wegner</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Sahlström</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Pleißner</surname>
              <given-names>K.P.</given-names>
            </name>
            <name>
              <surname>Oswald</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Fleck</surname>
              <given-names>E.</given-names>
            </name>
          </person-group>
          <article-title>Eine hierarchische Wasserscheidentransformation für die Spotdetektion in 2D-Gel-Elektrophorese-Bildern</article-title>
          <source>Proceedings: Bildverarbeitung für die Medizin</source>
          <conf-loc>Aachen, Germany</conf-loc>
          <conf-date>26–27 March, 1998</conf-date>
        </citation>
      </ref>
      <ref id="B50-metabolites-02-00733">
        <label>50.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Meyer</surname>
              <given-names>F.</given-names>
            </name>
            <name>
              <surname>Beucher</surname>
              <given-names>S.</given-names>
            </name>
          </person-group>
          <article-title>Morphological segmentation</article-title>
          <source>J. Vis. Commun. Image R.</source>
          <year>1990</year>
          <volume>1</volume>
          <fpage>21</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1016/1047-3203(90)90014-M</pub-id>
        </citation>
      </ref>
      <ref id="B51-metabolites-02-00733">
        <label>51.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vincent</surname>
              <given-names>L.</given-names>
            </name>
          </person-group>
          <article-title>Watersheds in Digital Spaces: An Efficient Algorithm Based on Immersion Simulations</article-title>
          <source>IEEE T. Pattern. Anal.</source>
          <year>1991</year>
          <volume>13</volume>
          <fpage>583</fpage>
          <lpage>598</lpage>
          <pub-id pub-id-type="doi">10.1109/34.87344</pub-id>
        </citation>
      </ref>
      <ref id="B52-metabolites-02-00733">
        <label>52.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Peak Finding and Referencing in MCC/IMS-Data</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2008</year>
          <volume>11</volume>
          <fpage>83</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-008-0012-7</pub-id>
        </citation>
      </ref>
      <ref id="B53-metabolites-02-00733">
        <label>53.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ward</surname>
              <given-names>J.H.</given-names>
            </name>
          </person-group>
          <article-title>Hierarchical grouping to optimize an objective function</article-title>
          <source>J. Am. Stat. Assoc.</source>
          <year>1963</year>
          <pub-id pub-id-type="doi">10.1080/01621459.1963.10500845</pub-id>
        </citation>
      </ref>
      <ref id="B54-metabolites-02-00733">
        <label>54.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sturm</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Bertsch</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Gröpl</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Hildebrandt</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Hussong</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Lange</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Pfeifer</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Schulz-Trieglaff</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Zerck</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Reinert</surname>
              <given-names>K.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>OpenMS—An open-source software framework for mass spectrometry</article-title>
          <source>BMC Bioinformatics</source>
          <year>2008</year>
          <pub-id pub-id-type="doi">10.1186/1471-2105-9-163</pub-id>
        </citation>
      </ref>
      <ref id="B55-metabolites-02-00733">
        <label>55.</label>
        <citation citation-type="thesis">
          <person-group person-group-type="author">
            <name>
              <surname>Lesniak</surname>
              <given-names>T.</given-names>
            </name>
          </person-group>
          <article-title>Entwurf, Erprobung und Bewertung eines Informationsschemas für Untersuchungen von Metaboliten</article-title>
          <comment>Diploma Thesis, University of Dortmund, Dortmund, Germany, 2007.</comment>
        </citation>
      </ref>
      <ref id="B56-metabolites-02-00733">
        <label>56.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chen</surname>
              <given-names>R.S.</given-names>
            </name>
            <name>
              <surname>Nadkarni</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Marenco</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Levin</surname>
              <given-names>F.</given-names>
            </name>
            <name>
              <surname>Erdos</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Miller</surname>
              <given-names>P.L.</given-names>
            </name>
          </person-group>
          <article-title>Exploring Performance Issues for a Clinical Database Organized Using an Entity-Attribute-Value Representation</article-title>
          <source>J. Am. Med. Inform. Assn.</source>
          <year>2000</year>
          <volume>7</volume>
          <fpage>475</fpage>
          <lpage>487</lpage>
          <pub-id pub-id-type="doi">10.1136/jamia.2000.0070475</pub-id>
        </citation>
      </ref>
      <ref id="B57-metabolites-02-00733">
        <label>57.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vogtland</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Breit-Wigner-Function and IMS-Signals</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2009</year>
          <volume>12</volume>
          <fpage>109</fpage>
          <lpage>114</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-009-0027-8</pub-id>
        </citation>
      </ref>
      <ref id="B58-metabolites-02-00733">
        <label>58.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bessa</surname>
              <given-names>V.</given-names>
            </name>
            <name>
              <surname>Darwiche</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Teschler</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Sommerwerck</surname>
              <given-names>U.</given-names>
            </name>
            <name>
              <surname>Rabis</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
            <name>
              <surname>Freitag</surname>
              <given-names>L.</given-names>
            </name>
          </person-group>
          <article-title>Detection of volatile organic compounds (VOCs) in exhaled breath of patients with chronic obstructive pulmonary disease (COPD) by ion mobility spectrometry</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2011</year>
          <volume>14</volume>
          <fpage>7</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-011-0060-2</pub-id>
        </citation>
      </ref>
      <ref id="B59-metabolites-02-00733">
        <label>59.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Koczulla</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Hattesohl</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Schmid</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>MCC/IMS as potential noninvasive technique in the diagnosis of patients with COPD with and without alpha 1-antitrypsin deficiency</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2011</year>
          <volume>14</volume>
          <fpage>177</fpage>
          <lpage>185</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-011-0070-0</pub-id>
        </citation>
      </ref>
      <ref id="B60-metabolites-02-00733">
        <label>60.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Rabis</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Sommerwerck</surname>
              <given-names>U.</given-names>
            </name>
            <name>
              <surname>Anhenn</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Darwiche</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Freitag</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Teschler</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Detection of infectious agents in the airways by ion mobility spectrometry of exhaled breath</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2011</year>
          <volume>14</volume>
          <fpage>187</fpage>
          <lpage>195</lpage>
        </citation>
      </ref>
      <ref id="B61-metabolites-02-00733">
        <label>61.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Rabis</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Sommerwerck</surname>
              <given-names>U.</given-names>
            </name>
            <name>
              <surname>Anhenn</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Darwiche</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Freitag</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Teschler</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Correlation analysis on data sets to detect infectious agents in the airways by ion mobility spectrometry of exhaled breath</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2011</year>
          <volume>14</volume>
          <fpage>197</fpage>
          <lpage>206</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-011-0076-7</pub-id>
        </citation>
      </ref>
      <ref id="B62-metabolites-02-00733">
        <label>62.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kreuder</surname>
              <given-names>A.-E.</given-names>
            </name>
            <name>
              <surname>Buchinger</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Kreuer</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Volk</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Characterization of propofol in human breath of patients undergoing anesthesia</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2011</year>
          <volume>14</volume>
          <fpage>167</fpage>
          <lpage>175</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-011-0080-y</pub-id>
        </citation>
      </ref>
      <ref id="B63-metabolites-02-00733">
        <label>63.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Carstens</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Hirn</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Quintel</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Nolte</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Juenger</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Perl</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
          </person-group>
          <article-title>On-line determination of serum propofol concentrations by expired air analysis</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2010</year>
          <volume>13</volume>
          <fpage>37</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-010-0036-7</pub-id>
        </citation>
      </ref>
      <ref id="B64-metabolites-02-00733">
        <label>64.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pearson</surname>
              <given-names>K.</given-names>
            </name>
          </person-group>
          <article-title>On lines and planes of closest fit to systems of points in space</article-title>
          <source>Philosophical Magazine</source>
          <year>1901</year>
          <volume>2</volume>
          <fpage>559</fpage>
          <lpage>572</lpage>
          <pub-id pub-id-type="doi">10.1080/14786440109462720</pub-id>
        </citation>
      </ref>
      <ref id="B65-metabolites-02-00733">
        <label>65.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Westhoff</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Litterst</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Rahmann</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Davies</surname>
              <given-names>A.N.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Differentiation of chronic obstructive pulmonary disease (COPD) including lung cancer from healthy control group by breath analysis using ion mobility spectrometry</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2010</year>
          <volume>13</volume>
          <fpage>131</fpage>
          <lpage>139</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-010-0049-2</pub-id>
        </citation>
      </ref>
      <ref id="B66-metabolites-02-00733">
        <label>66.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Westhoff</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Litterst</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Maddula</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Bödeker</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Statistical and bioinformatical methods to differentiate chronic obstructive pulmonary disease (COPD) including lung cancer from healthy control by breath analysis using ion mobility spectrometry</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2011</year>
          <volume>14</volume>
          <fpage>139</fpage>
          <lpage>149</lpage>
        </citation>
      </ref>
      <ref id="B67-metabolites-02-00733">
        <label>67.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Cheung</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Thomas</surname>
              <given-names>C.L.P.</given-names>
            </name>
            <name>
              <surname>Goodacre</surname>
              <given-names>R.</given-names>
            </name>
          </person-group>
          <article-title>Discrimination of bacteria using pyrolysis-gas chromatography-differential mobility spectrometry (Py-GC-DMS) and chemometrics</article-title>
          <source>Analyst</source>
          <year>2009</year>
          <volume>134</volume>
          <fpage>557</fpage>
          <lpage>563</lpage>
          <pub-id pub-id-type="doi">10.1039/b812666f</pub-id>
        </citation>
      </ref>
      <ref id="B68-metabolites-02-00733">
        <label>68.</label>
        <citation citation-type="web">
          <person-group person-group-type="author">
            <collab>R Development Core Team</collab>
          </person-group>
          <article-title>R: A language and environment for statistical computing</article-title>
          <access-date>(accessed on 12 October 2012)</access-date>
          <comment>Available online: <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.google.com.hk/url?sa=t&amp;rct=j&amp;q=A+language+and+environment+for+statistical+computing&amp;source=web&amp;cd=1&amp;ved=0CCoQFjAA&amp;url=http%3A%2F%2Fwww.lsw.uni-heidelberg.de%2Fusers%2Fchristlieb%2Fteaching%2FUKStaSS10%2FR-refman.pdf&amp;ei=_753UMmgJ--eiAeu7IGoAQ&amp;usg=AFQjCNHz-GCuz9CII0JC8onCa91DwwVoHQ&amp;cad=rjt/" ext-link-type="uri">http://www.google.com.hk/url?sa=t&amp;rct=j&amp;q=A+language+and+environment+for+statistical+computing&amp;source=web&amp;cd=1&amp;ved=0CCoQFjAA&amp;url=http%3A%2F%2Fwww.lsw.uni-heidelberg.de%2Fusers%2Fchristlieb%2Fteaching%2FUKStaSS10%2FR-refman.pdf&amp;ei=_753UMmgJ--eiAeu7IGoAQ&amp;usg=AFQjCNHz-GCuz9CII0JC8onCa91DwwVoHQ&amp;cad=rjt/</ext-link></comment>
        </citation>
      </ref>
      <ref id="B69-metabolites-02-00733">
        <label>69.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Revercomb</surname>
              <given-names>H.E.</given-names>
            </name>
            <name>
              <surname>Mason</surname>
              <given-names>E.A.</given-names>
            </name>
          </person-group>
          <article-title>Theory of Plasma Chromatography/Gaseous Electrophoresis—A Review</article-title>
          <source>Anal. Chem.</source>
          <year>1975</year>
          <volume>47</volume>
          <fpage>970</fpage>
          <lpage>983</lpage>
          <pub-id pub-id-type="doi">10.1021/ac60357a043</pub-id>
        </citation>
      </ref>
      <ref id="B70-metabolites-02-00733">
        <label>70.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Benezra</surname>
              <given-names>S.A.</given-names>
            </name>
          </person-group>
          <article-title>Separation of Mixtures of Aromatic Ketones in Sub-Nanogram Range by Plasma Chromatography</article-title>
          <source>J. Chromatogr. Sci.</source>
          <year>1976</year>
          <volume>14</volume>
          <fpage>122</fpage>
          <lpage>125</lpage>
        </citation>
      </ref>
      <ref id="B71-metabolites-02-00733">
        <label>71.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Karasek</surname>
              <given-names>F.W.</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>S.H.</given-names>
            </name>
            <name>
              <surname>Rokushika</surname>
              <given-names>S.</given-names>
            </name>
          </person-group>
          <article-title>Plasma chromatography of alkyl amines</article-title>
          <source>Anal. Chem.</source>
          <year>1978</year>
          <volume>50</volume>
          <fpage>2013</fpage>
          <lpage>2016</lpage>
          <pub-id pub-id-type="doi">10.1021/ac50036a019</pub-id>
        </citation>
      </ref>
      <ref id="B72-metabolites-02-00733">
        <label>72.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Wessel</surname>
              <given-names>M.D.</given-names>
            </name>
            <name>
              <surname>Sutter</surname>
              <given-names>J.M.</given-names>
            </name>
            <name>
              <surname>Jurs</surname>
              <given-names>P.C.</given-names>
            </name>
          </person-group>
          <article-title>Prediction of Reduced Ion Mobility Constants of Organic Compounds from Molecular Structure</article-title>
          <source>Anal. Chem.</source>
          <year>1996</year>
          <volume>68</volume>
          <fpage>4237</fpage>
          <lpage>4243</lpage>
          <pub-id pub-id-type="doi">10.1021/ac960466t</pub-id>
        </citation>
      </ref>
      <ref id="B73-metabolites-02-00733">
        <label>73.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Liu</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Yao</surname>
              <given-names>X.</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>Z.</given-names>
            </name>
            <name>
              <surname>Fan</surname>
              <given-names>B.</given-names>
            </name>
          </person-group>
          <article-title>Prediction of gas-phase reduced ion mobility constants (K0) based on the multiple linear regression and projection pursuit regression</article-title>
          <source>Talanta</source>
          <year>2007</year>
          <volume>71</volume>
          <fpage>258</fpage>
          <lpage>263</lpage>
          <pub-id pub-id-type="doi">10.1016/j.talanta.2006.03.058</pub-id>
        </citation>
      </ref>
      <ref id="B74-metabolites-02-00733">
        <label>74.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hariharan</surname>
              <given-names>C.B.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
            <name>
              <surname>Vautz</surname>
              <given-names>W.</given-names>
            </name>
          </person-group>
          <article-title>Linearized Equations for the Reduced Ion Mobilities of Polar Aliphatic Organic Compounds</article-title>
          <source>Anal. Chem.</source>
          <year>2010</year>
          <volume>82</volume>
          <fpage>427</fpage>
          <lpage>431</lpage>
          <pub-id pub-id-type="doi">10.1021/ac902459m</pub-id>
        </citation>
      </ref>
      <ref id="B75-metabolites-02-00733">
        <label>75.</label>
        <citation citation-type="confproc">
          <person-group person-group-type="author">
            <name>
              <surname>Friedman</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Getoor</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Koller</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Pfeffer</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>Learning Probabilistic Relational Models</article-title>
          <source>Proceedings of the Sixteenth International Joint Conference on Artificial Intelligence (IJCAI-99)</source>
          <conf-loc>Stockholm, Sweden</conf-loc>
          <conf-date>July 31–August 6 1999</conf-date>
          <fpage>1300</fpage>
          <lpage>1309</lpage>
        </citation>
      </ref>
      <ref id="B76-metabolites-02-00733">
        <label>76.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Finthammer</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Beierle</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Fisseler</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Kern-Isberner</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Möller</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>Probabilistic Relational Learning for Medical Diagnosis Based on Ion Mobility Spectrometry</article-title>
          <source>Int. J. Ion Mobility Spectrom.</source>
          <year>2010</year>
          <volume>13</volume>
          <fpage>83</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1007/s12127-010-0042-9</pub-id>
        </citation>
      </ref>
      <ref id="B77-metabolites-02-00733">
        <label>77.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Muggleton</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>de Raedt</surname>
              <given-names>L.</given-names>
            </name>
          </person-group>
          <article-title>Inductive logic programming: Theory and methods</article-title>
          <source>J. Logic Program.</source>
          <year>1994</year>
          <volume>19/20</volume>
          <fpage>629</fpage>
          <lpage>679</lpage>
          <pub-id pub-id-type="doi">10.1016/0743-1066(94)90035-3</pub-id>
        </citation>
      </ref>
      <ref id="B78-metabolites-02-00733">
        <label>78.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Baumbach</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Bunkowski</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Lange</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Oberwahrenbrock</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Kleinboelting</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Rahmann</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
          </person-group>
          <article-title>IMS2—An integrated medical software system for early lung cancer detection using ion mobility spectrometry data of human breath</article-title>
          <source>J. Integr. Bioinformatics</source>
          <year>2007</year>
          <volume>4</volume>
          <fpage>75</fpage>
        </citation>
      </ref>
      <ref id="B79-metabolites-02-00733">
        <label>79.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hauschild</surname>
              <given-names>A.-C.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.I.</given-names>
            </name>
            <name>
              <surname>Baumbach</surname>
              <given-names>J.</given-names>
            </name>
          </person-group>
          <article-title>Integrated Statistical Learning of Metabolic Ion Mobility Spectrometry Profiles for Pulmonary Disease Identification</article-title>
          <source>Genet. Mol. Res.</source>
          <year>2012</year>
          <volume>11</volume>
          <fpage>2733</fpage>
          <lpage>2744</lpage>
          <pub-id pub-id-type="doi">10.4238/2012.July.10.17</pub-id>
        </citation>
      </ref>
      <ref id="B80-metabolites-02-00733">
        <label>80.</label>
        <citation citation-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Khatri</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Sirota</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Butte</surname>
              <given-names>A.J.</given-names>
            </name>
          </person-group>
          <article-title>Ten Years of Pathway Analysis: Current Approaches and Outstanding Challenges</article-title>
          <source>PLoS Comput. Biol.</source>
          <year>2012</year>
          <volume>8</volume>
          <fpage>e1002375</fpage>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002375</pub-id>
        </citation>
      </ref>
    </ref-list>
  </back>
</article>
