<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMBE</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Biomed Eng</journal-id>
      <journal-title>JMIR Biomedical Engineering</journal-title>
      <issn pub-type="epub">2561-3278</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v5i1e13611</article-id>
      <article-id pub-id-type="pmid"/>
      <article-id pub-id-type="doi">10.2196/13611</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Robust Feature Engineering for Parkinson Disease Diagnosis: New Machine Learning Techniques</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Korchi</surname>
            <given-names>Amine</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chaibub Neto</surname>
            <given-names>Elias</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Max</given-names>
          </name>
          <degrees>BAdvComp (R&amp;D) (Hons)</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2121-9848</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Ge</surname>
            <given-names>Wenbo</given-names>
          </name>
          <degrees>BE (Hons)</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0429-3061</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Apthorp</surname>
            <given-names>Deborah</given-names>
          </name>
          <degrees>PhD, BPsych (Hons)</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5785-024X</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Suominen</surname>
            <given-names>Hanna</given-names>
          </name>
          <degrees>MSc, Docent, SFHEA, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Research School of Computer Science</institution>
            <institution>College of Engineering and Computer Science</institution>
            <institution>The Australian National University</institution>
            <addr-line>ANU Research School of Computer Science, Hanna Neumann Building, Room 2.35</addr-line>
            <addr-line>145 Science Road</addr-line>
            <addr-line>Canberra, ACT, 2600</addr-line>
            <country>Australia</country>
            <phone>61 431 913 826</phone>
            <email>hanna.suominen@anu.edu.au</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4195-1641</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Research School of Computer Science</institution>
        <institution>College of Engineering and Computer Science</institution>
        <institution>The Australian National University</institution>
        <addr-line>Canberra, ACT</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>School of Psychology</institution>
        <institution>Faculty of Medicine and Health</institution>
        <institution>University of New England</institution>
        <addr-line>Armidale, NSW</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Machine Learning Research Group</institution>
        <institution>Data61</institution>
        <institution>The Commonwealth Scientific and Industrial Research Organisation (CSIRO)</institution>
        <addr-line>Canberra</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Future Technologies</institution>
        <institution>Faculty of Science and Engineering</institution>
        <institution>University of Turku</institution>
        <addr-line>Turku</addr-line>
        <country>Finland</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hanna Suominen <email>hanna.suominen@anu.edu.au</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jan-Dec</season>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>27</day>
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <volume>5</volume>
      <issue>1</issue>
      <elocation-id>e13611</elocation-id>
      <history>
        <date date-type="received">
          <day>4</day>
          <month>2</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>2</day>
          <month>10</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>27</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>5</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Max Wang, Wenbo Ge, Deborah Apthorp, Hanna Suominen. Originally published in JMIR Biomedical Engineering (http://biomedeng.jmir.org), 27.07.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Biomedical Engineering, is properly cited. The complete bibliographic information, a link to the original publication on http://biomedeng.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://biomedeng.jmir.org/2020/1/e13611" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Parkinson disease (PD) is a common neurodegenerative disorder that affects between 7 and 10 million people worldwide. No objective test for PD currently exists, and studies suggest misdiagnosis rates of up to 34%. Machine learning (ML) presents an opportunity to improve diagnosis; however, the size and nature of data sets make it difficult to generalize the performance of ML models to real-world applications.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to consolidate prior work and introduce new techniques in feature engineering and ML for diagnosis based on vowel phonation. Additional features and ML techniques were introduced, showing major performance improvements on the large mPower vocal phonation data set.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used 1600 randomly selected /aa/ phonation samples from the entire data set to derive rules for filtering out faulty samples from the data set. The application of these rules, along with a joint age-gender balancing filter, results in a data set of 511 PD patients and 511 controls. We calculated features on a 1.5-second window of audio, beginning at the 1-second mark, for a support vector machine. This was evaluated with 10-fold cross-validation (CV), with stratification for balancing the number of patients and controls for each CV fold.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We showed that the features used in prior literature do not perform well when extrapolated to the much larger mPower data set. Owing to the natural variation in speech, the separation of patients and controls is not as simple as previously believed. We presented significant performance improvements using additional novel features (with 88.6% certainty, derived from a Bayesian correlated t test) in separating patients and controls, with accuracy exceeding 58%.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The results are promising, showing the potential for ML in detecting symptoms imperceptible to a neurologist.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>machine learning</kwd>
        <kwd>mobile phone</kwd>
        <kwd>nonlinear dynamics</kwd>
        <kwd>Parkinson disease</kwd>
        <kwd>signal processing, computer-assisted</kwd>
        <kwd>speech</kwd>
        <kwd>biomarkers</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p><italic>Parkinson disease</italic> (PD) affects approximately 1% of the population by the age of 70 years. It is characterized by the deterioration of dopamine-producing neurons in the brain, resulting in symptoms such as abnormal gait, speech, and tremor [<xref ref-type="bibr" rid="ref1">1</xref>]. Current treatments can provide temporary relief from symptoms and slow its progression [<xref ref-type="bibr" rid="ref2">2</xref>]; however, these treatments cannot repair damage from the disease. Thus, obtaining an accurate early diagnosis is of high importance.</p>
        <p>PD is currently diagnosed with a standardized but subjective test administered by a neurologist or a clinician, the <italic>Unified Parkinson’s Disease Rating Scale</italic> (UPDRS) [<xref ref-type="bibr" rid="ref3">3</xref>]. It is not easy to diagnose, as only a subset of symptoms is present in any one patient [<xref ref-type="bibr" rid="ref4">4</xref>] and there are many diseases with similar symptoms [<xref ref-type="bibr" rid="ref5">5</xref>]. PD is especially difficult to diagnose in its early stages, as it is believed that most symptoms only manifest once 20% to 40% of dopamine-producing neurons have deteriorated [<xref ref-type="bibr" rid="ref6">6</xref>]. Autopsy is one of the only reliable ways to confirm diagnosis, and studies have shown a misdiagnosis rate ranging between 9% and 34% [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref7">7</xref>].</p>
        <p>Therefore, the search for a more objective measure for diagnosis is a timely topic in the research community. Discovering more quantifiable biomarkers from sources such as gene expression [<xref ref-type="bibr" rid="ref8">8</xref>] and bodily fluids [<xref ref-type="bibr" rid="ref9">9</xref>] is a promising option; however, it is likely that costs will be prohibitive for most early-stage patients uncertain about diagnosis. <italic>Machine learning</italic> (ML) on data from more accessible sources is another viable option, potentially offering an objective and low-cost tool to assist the neurologist in diagnosis through a smartphone-derived version of the UPDRS [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>In this study, we consolidated feature engineering techniques with advances in ML to develop a strong model for PD diagnosis on a large vocal phonation data set. We explored the challenges involved in training ML models on noisy, crowdsourced data and delved into the field of signal processing for audio data. We also found that the experimental setup for classifying healthy and diagnosed individuals does not match the diagnosis process of a neurologist. In addition to merely presenting results as a performance metric, we provided insights into the behavior of these models and showed that it is possible for ML to exceed the performance of clinicians in precise phonation analysis and potentially uncover new biomarkers for PD.</p>
        <p>There is a major interest in using ML to assist in PD diagnosis, and current results are positive—often the reported accuracy percentage is in the high 90s using only speech or accelerometer data [<xref ref-type="bibr" rid="ref11">11</xref>]. However, these results should not be taken at face value, as the experimental setup involves differentiating between (potentially incorrectly) diagnosed PD patients and <italic>healthy controls</italic> (HCs). This oversimplifies the complexities involved in a neurologist’s diagnosis in a clinical situation, where the clinician must exclude a number of other causes for the symptoms and handle early-stage patients exhibiting minimal symptoms. Furthermore, the data sets associated with these publications generally consist of fewer than 40 subjects. For such small samples, it is difficult to control for bias and to prevent the overfitting of ML models.</p>
        <p>Considering the issues with current data sets, there is an open question as to how ML models should be evaluated. One obvious option is to create a data set by monitoring subjects before any Parkinsonian symptoms until they pass, where the existence of PD can be confirmed through autopsy. With such a longitudinal data set, we could directly compare the performance of ML and neurologists. However, such a data set would be very costly and logistically difficult to collect. To advocate for its collection, there needs to be some evidence of ML effectiveness [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
        <p>Consequently, the question we are most interested in is whether ML techniques can extract more information than observations from a trained clinician. As neurological diagnosis relies on judgment from observation, it is possible that some symptoms are imperceptible but detectable with ML on high-resolution sensor data. Specifically, our research question was to examine whether speech symptoms imperceptible to the human ear can be detected in microphone data using ML.</p>
        <p>A larger data set than those that tend to be used in most studies is required to ensure that the results are statistically robust and not influenced by bias. This is not to say that having a larger data set will ensure that there is less influence of bias, but rather that from a larger data set, we can take subsets that are less influenced by biases. We chose the <italic>mPower data set</italic> [<xref ref-type="bibr" rid="ref12">12</xref>], which contains phonations of the vowel <italic>/aa/</italic> from 6000 patients as recorded by an iPhone microphone at 44<italic>,</italic>100 Hz.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Features</title>
        <p>In this subsection, we describe the methodological background of our study and its feature engineering and signal processing. The subsections after this explain the novel features and materials in our experimental setup. The 2 objectives of these experiments were (1) to consolidate and replicate prior work on a much larger scale and (2) to introduce additional features for dysphonia signal processing to better understand how these features relate to a clinician’s diagnosis with speech.</p>
        <p>Vocal phonation is the prolonged pronunciation of a sound such as <italic>/aa/</italic>. It is an interesting task for diagnosing PD, with evidence symptoms present earlier than other motor symptoms [<xref ref-type="bibr" rid="ref13">13</xref>]. It also avoids the complexities involved in modeling speech and is, therefore, an easier task in the context of ML. Prior works have shown promising performance, with accuracies of up to 91<italic>.</italic>4% [<xref ref-type="bibr" rid="ref14">14</xref>] and 98<italic>.</italic>6% [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
        <p>Biologically, phonation is produced by 2 components: the vocal folds and the vocal tract. The vocal folds consist of a flap called the <italic>glottis</italic>, which can be opened and closed. During phonation, air expelled from the lungs causes the glottis to oscillate, producing sound at a range of frequencies. The lowest of these frequencies—the <italic>fundamental frequency</italic>, <italic>f</italic><sub>0</sub>—represents the duration of 1 oscillation and is often denoted as the <italic>pitch period</italic>. The vocal tract comprises components such as the mouth and nose, and it <italic>shapes</italic> the sound by amplifying and attenuating certain frequencies. The vocal folds and tract can be viewed as a <italic>source-filter model</italic>, where the source of vocal folds generates the sound signal, shaped (or filtered) by the vocal tract. With PD, the impairment of fine motor control reduces control of the glottis, causing incomplete vocal fold closure. The turbulent airflow around the glottis causes a sound described as a <italic>breathy</italic> or <italic>hoarse</italic> voice and results in increased variation over each glottal cycle. This is termed as <italic>dysphonia</italic>. A similar phenomenon occurs when the vocal folds are irritated by physical causes, such as colds, and it is currently unknown whether differentiation between neurological and physical dysphonia is possible. It is also worth noting that airway diseases as well as muscular diseases and other psychological disorders can also affect the process of sound generation.</p>
        <p>People with PD also experience hesitant speech from reduction of cognitive ability and slurred or imprecise articulation from loss of motor control over the vocal tract. This is termed as <italic>dysarthria</italic>. Although dysarthria is very noticeable to humans, it is difficult to quantify it computationally. Spoken language has a wide variety of accents and styles, and it has been shown that models trained on English speakers do not generalize well on German speakers, and vice versa [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>Dysphonia can be measured using <italic>sustained vowel phonations</italic>, which are easier to model with traditional signal processing approaches and are suitable for small data sets. Dysphonia in vowel phonation is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. Optimally, both dysphonia- and dysarthria-related features would be used to build models; however, this study focused specifically on dysphonia because of limitations of the data set under consideration.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>/aa/phonation from an individual with dysphonia. Variations in jitter (variation in glottal cycle periods) and shimmer (variation in glottal cycle amplitude) are common features for the detection of dysphonia. Algorithms computing each glottal cycle are imperfect, especially for heavy dysphonia.</p>
          </caption>
          <graphic xlink:href="biomedeng_v5i1e13611_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Features for Dysphonia</title>
        <p>Data from a microphone are represented as a stream of values, corresponding to the value of the recorded sound wave at each point in time. A basic microphone samples at approximately 44<italic>,</italic>100 Hz and quantizes the wave to 2<sup>16</sup> possible values. The difference between higher sampling rates or more detailed quantization (such as 24 bit) is minimally perceptible to human ears; however, a major problem with low-quality microphones is additional noise and imprecise wave encoding.</p>
        <p>Approaches based on signal processing use features that estimate the qualities associated with dysphonia. We divided them into 3 groups: <italic>general</italic> techniques, which are suitable for any time series signal; <italic>dysphonia-specific</italic> techniques, which have been used in prior work specifically to model dysphonia; and <italic>novel</italic> features, which we have shortlisted from other applications as being potentially effective in quantifying dysphonia.</p>
        <sec>
          <title>General Signal Processing</title>
          <p><italic>Moments</italic> are basic statistical descriptors of a signal, with the first 3 moments representing mean, variance, and skewness. For speech, the mean is largely uninformative, and variance corresponds to volume. The zero-crossing rate measures how quickly the signal oscillates around 0 and is a measure of the signal frequency.</p>
          <p><italic>Entropy</italic> describes the amount of information in a piece of data, if it were modeled by a Bernoulli scheme. It is a simple measure of the complexity/information content of a signal.</p>
          <p>The <italic>Fourier</italic> transform decomposes a signal into the amplitudes of frequencies that compose it. This is referred to as mapping from the <italic>time</italic> domain to the <italic>frequency</italic> or <italic>spectral</italic> domain. For speech, this enables us to determine the frequency bands with more energy, corresponding to the fundamental frequency and harmonics. After performing a Fourier transform, the <italic>spectral entropy</italic> [<xref ref-type="bibr" rid="ref16">16</xref>] can be calculated, which can measure how <italic>sharp</italic> the <italic>f</italic><sub>0</sub> and harmonics of speech are. People with PD are expected to have a lower spectral entropy because of the less precise frequency control, causing a more <italic>blurred</italic> Fourier transform.</p>
          <p><italic>Squared</italic> energy operators, <italic>Teager-Kaiser</italic> energy operators, or other energy operators can obtain the instantaneous frequency and amplitude of a signal [<xref ref-type="bibr" rid="ref17">17</xref>]. Statistics such as mean or SD and other measures can be computed after applying an energy operator.</p>
        </sec>
        <sec>
          <title>Dysphonia Signal Processing</title>
          <p>The major feature present in dysphonic speech is the increased variation between each glottal cycle (<xref rid="figure1" ref-type="fig">Figure 1</xref>). <italic>Jitter</italic> measures the variation in the length of each glottal cycle, and <italic>shimmer</italic> [<xref ref-type="bibr" rid="ref18">18</xref>] is the variation in amplitude. These often rely on detecting each glottal cycle, which is not very accurate with current algorithms [<xref ref-type="bibr" rid="ref19">19</xref>]. The <italic>harmonics-to-noise ratio</italic> (HNR) [<xref ref-type="bibr" rid="ref20">20</xref>] measures the amount of noise in a signal, which correlates with the <italic>hoarseness</italic> or <italic>breathiness</italic> of speech. The HNR has been improved with a more robust <italic>glottal-to-noise excitation</italic> ratio [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
          <p>The <italic>vocal fold excitation ratio</italic> (VFER) is another extension of the HNR developed in the study by Tsanas et al [<xref ref-type="bibr" rid="ref22">22</xref>], which also introduced the <italic>Glottal Quotient</italic> (GQ), a measure of the SD duration while the glottis is opened and closed. Both VFER and GQ are built upon concepts of the fundamental frequency estimation algorithm [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
          <p><italic>Mel-frequency cepstral coefficients</italic> (MFCCs) are one of the most effective features for speech recognition models, so it is no surprise that they are shown to be similarly effective for dysphonia. Speech recognition involves computing the MFCC at short time intervals and using a Markov model or structured neural network to model temporal information, whereas statistical descriptors have been shown to be effective in detecting dysphonia [<xref ref-type="bibr" rid="ref11">11</xref>]. There still exists a gap in understanding the relationships between the coefficients and dysphonia.</p>
          <p>A recent study [<xref ref-type="bibr" rid="ref24">24</xref>] showed that <italic>detrended fluctuation analysis</italic>, originally introduced as a measure of the autocorrelation (<italic>autocorrelation</italic> describes the similarity of a signal to itself when offset by a given interval) of a signal, changes with the amount of turbulent airflow in speakers with dysphonia. This study has also proposed the <italic>recurrence period density entropy</italic> (RPDE), which characterizes the periodicity of a signal. These measures are expected to be lower for speakers with dysphonia because of the noise introduced by turbulent airflow. Another study [<xref ref-type="bibr" rid="ref14">14</xref>] has built upon RPDE to develop <italic>pitch period entropy</italic> as a better measure of the impaired control of pitch experienced by PD patients.</p>
        </sec>
      </sec>
      <sec>
        <title>Novel Features</title>
        <p>Although existing features have achieved good results on their respective data sets, we have obtained improved performance with this additional set of features. These novel features may not directly relate to dysphonia but have been effective in other signal processing applications, most commonly <italic>electroencephalogram</italic> (EEG), which, similar to speech, is difficult to characterize.</p>
        <p>A number of these features relate to <italic>chaos theory</italic>—a field based on understanding the behavior of dynamical systems sensitive to initial conditions [<xref ref-type="bibr" rid="ref25">25</xref>]. One can imagine the generation of a speech signal as a system, where parameters involve the state of components in the vocal tract. Given no change in parameters such as vocal fold tension, regular <italic>/aa/</italic> phonation can be modeled with much fewer dimensions in <italic>phase</italic> space [<xref ref-type="bibr" rid="ref26">26</xref>]—all possible states of a dynamic system.</p>
        <p>The <italic>Lyapunov exponents</italic> quantify the divergence of 2 systems with similar initial parameters. The <italic>largest Lyapunov exponent</italic> (<italic>λ</italic><sup>∗</sup>) characterizes the chaos in a system and is commonly estimated with the algorithm described in the study by Rosenstein et al [<xref ref-type="bibr" rid="ref26">26</xref>], which reconstructs the system dynamics using a time delay technique. The inverse of <inline-graphic xlink:href="biomedeng_v5i1e13611_fig4.png" xlink:type="simple" mimetype="image"/> is the Lyapunov time, which defines how long the behavior of a system can be predicted.</p>
        <p>The <italic>fractal dimension</italic> is also commonly used in the analysis of dynamical systems. It represents the ratio of the log change in detail to the log change in scale of a signal [<xref ref-type="bibr" rid="ref27">27</xref>]. This is similar to the coastline paradox, where measuring a coastline with smaller sticks results in an apparent increase in length. The fractal dimension correlates to the complexity of a signal. It has been shown that the fractal dimension of elderly individuals balancing on a force plate is greater than that of younger individuals [<xref ref-type="bibr" rid="ref28">28</xref>] and, more importantly, that distinct patterns seen in deterministic recurrence quantification analysis of sway (similar to fractal dimension) distinguish patients with PD from controls [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>General entropy will not differentiate 2 sequences where the frequency of each variable is the same; however, the sequences 0, 0, 0, 0, 1, 1, 1, 1 and 0, 1, 0, 0, 1, 1, 0, 1 are clearly generated by different stochastic processes. The <italic>approximate</italic> and <italic>sample entropy</italic> aims to quantify this [<xref ref-type="bibr" rid="ref30">30</xref>]. This is extended with multiscale sample entropy [<xref ref-type="bibr" rid="ref31">31</xref>], which is an especially powerful tool in the analysis of biological signals.</p>
        <p>Although signals may appear to have high information content in the time domain, they may be easier to represent in others. For example, the JPEG image compression format primarily relies on human vision, which is less sensitive to high-frequency image details. Images are compressed by taking a Fourier transform and downsampling the high-frequency information. <italic>Spectral entropy</italic> measures the information content of the signal in its frequency-domain representation. The <italic>singular value decomposition</italic> (SVD) factorizes a matrix into orthogonal matrices and <italic>singular values</italic>. <italic>SVD entropy</italic> [<xref ref-type="bibr" rid="ref16">16</xref>] measures the entropy of the singular values obtained when the signal is embedded with the algorithm described in the study by Rosenstein et al [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>Many of these features are not simple to interpret; however, our testing shows that they provided significant improvements over prior features used in the literature.</p>
      </sec>
      <sec>
        <title>Materials</title>
        <p>We chose the mPower data set [<xref ref-type="bibr" rid="ref12">12</xref>]—a crowdsourced data set consisting of 65<italic>,</italic>000 <italic>/aa/</italic> phonation samples from 6000 participants, of which 1200 were participants with PD.</p>
        <p>The primary issue with mPower is quality. Owing to crowdsourcing, participants who are dishonest or perform the task incorrectly can skew results. There are a number of subjects with young-onset PD in mPower; young-onset PD is very uncommon in the general population, but this representation may be possible because of the younger target audience of smartphone apps. Vowel phonation has been captured with a single channel iPhone/iPod microphone at 44,100 Hz, with the different microphone technology in each generation introducing another variable to the model. Hesitation and phonation of vowels other than /aa/ are common, and the distance between the phone and the user varies: with some speaking directly into the microphone, creating <italic>wind noise</italic>, and others at a distance, introducing significant environmental noise.</p>
        <p>We evaluated 1600 randomly selected phonation samples for performing the task correctly, rejecting approximately 40% by using the aforementioned wind, distance, and environmental noise. Using short time energies extracted at 0.1-second intervals with OpenSMILE [<xref ref-type="bibr" rid="ref32">32</xref>], simple metrics such as variance, mean, and ranges were calculated to rank and filter the samples. Placing a threshold on these gave rise to hand-crafted rules to filter the remaining samples. After filtering, 4100 users remained, 900 with PD, each with a single corresponding sample. We then attempted to balance the joint age and gender distribution within the PD and control groups. Every PD participant had a gender and age <italic>twin</italic> (±2 years; the age-matching was conducted in a way that the twin was at most 2 years younger or older than the respective participant) selected; if a <italic>twin</italic> could not be found, that PD participant was discarded. This resulted in 1022 participants, 511 with PD. Standard libraries for computing the features used to build the modeling included the PyREM package for sleep staging from EEG data [<xref ref-type="bibr" rid="ref33">33</xref>], nolds [<xref ref-type="bibr" rid="ref34">34</xref>], and pypsr [<xref ref-type="bibr" rid="ref35">35</xref>] (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). The average <italic>f</italic><sub>0</sub> for males and females was assumed to be 120 Hz and 190 Hz, respectively. Sound bit depth was binned to <inline-graphic xlink:href="biomedeng_v5i1e13611_fig5.png" xlink:type="simple" mimetype="image"/> values for entropy-related calculations. In this feature experiment, we used 6 as the embedding dimension for the time delay embedding methods and calculated τ following the study by Rosenstein et al [<xref ref-type="bibr" rid="ref26">26</xref>]. Ethical aspects of this research have been approved by the ANU Human Research Ethics Committee with protocol number 2018/108.</p>
        <boxed-text id="box1" position="float">
          <title>Summary of the features used to build the model.</title>
          <p>
            <bold>Dysphonia features</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Prior dysphonia features from the study by Tsanas et al [<xref ref-type="bibr" rid="ref11">11</xref>]</p>
            </list-item>
            <list-item>
              <p>Wavelet transform–based features [<xref ref-type="bibr" rid="ref36">36</xref>]</p>
            </list-item>
          </list>
          <p>
            <bold>Novel features</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Higuchi and Petrosian fractal dimension</p>
            </list-item>
            <list-item>
              <p>Hurst exponent</p>
            </list-item>
            <list-item>
              <p>Time delay (<italic>τ</italic>)</p>
            </list-item>
            <list-item>
              <p>Lyapunov exponents (up to 6)</p>
            </list-item>
            <list-item>
              <p>Sample and approximate entropy (with <italic>r</italic> selected by Lu et al [<xref ref-type="bibr" rid="ref37">37</xref>]) and Fisher information [<xref ref-type="bibr" rid="ref38">38</xref>]</p>
            </list-item>
            <list-item>
              <p>Spectral entropy</p>
            </list-item>
            <list-item>
              <p>Singular value decomposition entropy</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Initial Model Validation: Replicating the Previous Results</title>
        <p>In a previous study, Tsanas et al [<xref ref-type="bibr" rid="ref11">11</xref>] used the National Crime Victimization Survey data set, which consists of 263 phonations from 33 people with PD and 10 HCs. A set of 132 features was calculated, and 100 times repeated 10-fold cross-validation (CV) was used to evaluate a <italic>support vector machine</italic> (SVM). On all features, they achieved 97.7% accuracy, and on a 10-feature subset selected by ReliefF, they achieved 98.6% accuracy. They also released an open-source toolbox to assist in replicating the results.</p>
        <p>Using this toolbox on our data set, we calculated features on a 1.5-second window of audio beginning at the 1-second mark. An SVM was evaluated with 10 times repeated 10-fold CV over the full feature set and the 10-feature ReliefF subset (<xref ref-type="table" rid="table1">Table 1</xref>). The data set was stratified by random sampling such that there were equal numbers of PD and control subjects in each fold of CV to better highlight performance. Note that this effectively reduced the data set to approximately 1700 phonations. A grid search was used to select the optimal hyperparameters for the SVM. Of the kernels tested, the <italic>radial basis function</italic> (RBF) was dominant in all models. A Bayesian correlated <italic>t</italic> test on accuracy was used to determine if a model dominated another [<xref ref-type="bibr" rid="ref39">39</xref>]. Accuracy was chosen, despite the recent popularity of the <italic>area under the receiver operating characteristic curve</italic> (AUROC) because of criticisms of its bias toward certain predictors [<xref ref-type="bibr" rid="ref40">40</xref>]. However, for the purposes of comparison with previously published work, we also reported sensitivity, specificity, and AUROC.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Cross-validation results of a support vector machine using the full feature set and 10-feature ReliefF subset.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Performance measures</td>
                <td>Full, mean (SD)</td>
                <td>ReliefF subset<sup>a</sup>, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy (%)</td>
                <td>55.6 (4.9)</td>
                <td>55.6 (4.5)</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity (%)</td>
                <td>52.3 (7.0)</td>
                <td>47.4 (6.6)</td>
              </tr>
              <tr valign="top">
                <td>Specificity (%)</td>
                <td>58.8 (7.8)</td>
                <td>63.8 (8.1)</td>
              </tr>
              <tr valign="top">
                <td>Area under the receiver operating characteristic curve (%)</td>
                <td>57.7 (5.7)</td>
                <td>58.2 (5.2)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>There is a 50.7% probability that the average performance of the ReliefF subset outperforms the full feature set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Initial Model Validation: Improving Previous Results With Novel Features</title>
        <p>The performance of the features by Tsanas et al [<xref ref-type="bibr" rid="ref11">11</xref>] on the mPower data was evidently worse than that of the NCVS data set. It is possible that this was a consequence of the noisier and lower-quality mPower data. However, overfitting in the original study by Tsanas et al [<xref ref-type="bibr" rid="ref11">11</xref>] is also highly likely, especially as evidenced by the fact that the MFCC-heavy ReliefF feature subset performed better in experiments by Tsanas et al [<xref ref-type="bibr" rid="ref11">11</xref>], whereas it performed substantially worse in our testing, achieving 55.6% accuracy rather than 98.6%. Another consideration is the number of observations within each group; having more participants within one group can arbitrarily increase accuracy. It is also ambiguous whether the authors had stratified the phonations on a per-subject scale—failure to do so introduces the <italic>digital fingerprinting</italic> effect. The analysis provided in a recent study [<xref ref-type="bibr" rid="ref41">41</xref>] exemplifies this, showing that allowing phonations from a subject to appear in both training and testing results in an AUROC of approximately 96%, compared with only 59% in a correctly stratified example.</p>
        <p>The features used in the prior literature were clearly insufficient to perform an accurate diagnosis. To improve the model, we introduced an additional range of features that have been effectively applied in the analysis of other biological signals. These features are not directly related to human hearing or speech and thus may be especially useful in detecting symptoms unnoticeable by an expert. We repeated the experiments, adding the novel features, with the results presented in <xref ref-type="table" rid="table2">Table 2</xref> showing significant improvement.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Cross validation results of the support vector machines using different feature sets.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="440"/>
            <col width="190"/>
            <col width="190"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Performance measures</td>
                <td>ReliefF subset, mean (SD)</td>
                <td>Novel only, mean (SD)</td>
                <td>Combined<sup>a</sup>, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy (%)</td>
                <td>55.6 (4.5)</td>
                <td>55.3 (4.8)</td>
                <td>58.2 (5.1)</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity (%)</td>
                <td>47.4 (6.6)</td>
                <td>45.1 (6.5)</td>
                <td>56.4 (6.8)</td>
              </tr>
              <tr valign="top">
                <td>Specificity (%)</td>
                <td>63.8 (8.1)</td>
                <td>65.5 (7.6)</td>
                <td>60.0 (7.0)</td>
              </tr>
              <tr valign="top">
                <td>Area under the receiver operating characteristic curve (%)</td>
                <td>58.2 (5.2)</td>
                <td>58.2 (5.2)</td>
                <td>60.7 (5.9)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>There is an 88.7% probability that the average performance of the combined subset outperforms the ReliefF subset.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Further Improvements: Ensemble Models and Data Augmentation</title>
        <p>Although the performance was improved, a 58.2% diagnosis accuracy is still far below the requirements for clinical use. In this section, we explore the reasons for the below-expected performance and methods of improving it.</p>
        <p>Many dysphonia features rely on estimating the precise length of each glottal cycle, for which the <italic>f</italic><sub>0</sub> algorithm of Camacho [<xref ref-type="bibr" rid="ref42">42</xref>] was used. A preliminary investigation showed that the SD of <italic>f</italic><sub>0</sub> exceeded 10 Hz for 18% of the phonations. This was indicative of a substantial failure of the algorithm or a poorly executed recording.</p>
        <sec>
          <title>Ensemble Models</title>
          <p>Visualizing the features as in <xref rid="figure2" ref-type="fig">Figure 2</xref>, it is evident that there are distinct distributions for individuals who are healthy and have PD as well as for males and females. However, there is a large amount of variance and overlap over these distributions, making it infeasible to perform diagnosis over one feature alone.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Visualization of detrended fluctuation analysis against recurrence period density entropy in male and female participants with PD and controls. Although the groups follow distinct distributions, there is heavy overlap. It is evidently difficult to classify PD based on any single feature, and powerful machine learning models are required to make sense of their relationships. PD: Parkinson disease.</p>
            </caption>
            <graphic xlink:href="biomedeng_v5i1e13611_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>Typically, an SVM only performs well if the features are good, which may require a lot of prior knowledge. This is because SVMs can only model linear relationships and, even with the use of nonlinear kernels, are restricted to that particular kernel and are often simple. Other algorithms, such as neural networks, can potentially learn to exploit complex nonlinear relationships between the features to increase performance.</p>
          <p>Given the complex relationships between features, it is possible that an ensemble model may achieve better performance. Ensemble models utilize multiple ML models and combine them to create a more powerful one. These ML models can typically be combined by averaging (ie, <italic>voting</italic>) or with other methods (eg, <italic>stacking</italic>), making the combined prediction more powerful than its individual parts.</p>
          <p>Building on stacking, <italic>feature-weighted linear stacking</italic> (FWLS [<xref ref-type="bibr" rid="ref43">43</xref>]) assigns a weight to each feature and model combination. This is motivated by different models being more suitable for using certain features. FWLS was the technique used to ensemble the hundred-model winner of the prestigious Netflix Prize [<xref ref-type="bibr" rid="ref44">44</xref>].</p>
          <p>We ensembled an SVM; Gaussian process; random forest; <italic>k</italic>-nearest neighbor classifier (with <italic>k</italic>=3); and simple dense neural networks with 3, 5, and 7 hidden layers. All models were suited to the task, diagnosing PD within 3% accuracy of each other. An RBF Gaussian process was chosen to aggregate the models in the stacking and FWLS-based ensembles, as Gaussian processes are inherently probabilistic and suitable for making decisions in situations of high uncertainty. The results are presented in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Cross validation results of different ensemble methods compared to the support vector machine-only model, using the combined feature set.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="310"/>
              <col width="210"/>
              <col width="120"/>
              <col width="130"/>
              <col width="230"/>
              <thead>
                <tr valign="top">
                  <td>Performance measures</td>
                  <td>Support vector machine only, mean (SD)</td>
                  <td>Voting, mean (SD)</td>
                  <td>Stacking, mean (SD)</td>
                  <td>Feature-weighted linear stacking<sup>a</sup>, mean (SD)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Accuracy (%)</td>
                  <td>58.2 (5.1)</td>
                  <td>56.5 (5.0)</td>
                  <td>59.1 (5.1)</td>
                  <td>5.92 (5.3)</td>
                </tr>
                <tr valign="top">
                  <td>Sensitivity (%)</td>
                  <td>56.4 (6.8)</td>
                  <td>54.9 (9.1)</td>
                  <td>57.4 (7.8)</td>
                  <td>57.4 (7.6)</td>
                </tr>
                <tr valign="top">
                  <td>Specificity (%)</td>
                  <td>60.0 (7.0)</td>
                  <td>58.1 (8.2)</td>
                  <td>60.9 (7.4)</td>
                  <td>61.1 (7.4)</td>
                </tr>
                <tr valign="top">
                  <td>Area under the receiver operating characteristic curve (%)</td>
                  <td>60.7 (5.9)</td>
                  <td>59.1 (5.6)</td>
                  <td>62.2 (5.8)</td>
                  <td>62.3 (5.9)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>There is a 70.6% probability that the average performance of the feature-weighted linear stacking ensemble outperforms the support vector machine-only model.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>Training ensembles is more computationally expensive; however, in practice, making a prediction from a pretrained model will take a negligible amount of time. Larger data sets may require the use of localized approximations for polynomially computable models such as SVMs and Gaussian processes. However, a major disadvantage of ensembles is the <italic>black box</italic> effect, where their predictions are effectively uninterpretable.</p>
        </sec>
        <sec>
          <title>Data Augmentation</title>
          <p>Some features were highly sensitive to minor fluctuations in the signal, with their value changing drastically depending on the segment used. Many of these features were not length invariant, and 10% varied by over 0.5 SDs when computed over the same phonation, offset by 0.1 seconds. We computed seven 1.5-second samples from each phonation, ranging from the 1.5- to 4.5-second mark with a 0.5-second step size. We experimented with taking the mean over all 7 values as well as augmenting the data by using the additional samples as extra CV input (ensuring that phonations from the same participant appeared in the same training set or test set). The results are presented in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Cross validation results of basic data augmentation techniques with the combined feature set and the support vector machine-only model.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="490"/>
              <col width="170"/>
              <col width="150"/>
              <col width="190"/>
              <thead>
                <tr valign="top">
                  <td>Performance measures</td>
                  <td>Original, mean (SD)</td>
                  <td>Mean,<sup>a</sup> mean (SD)</td>
                  <td>Augmented, mean (SD)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Accuracy (%)</td>
                  <td>58.2 (5.1)</td>
                  <td>58.7 (4.5)</td>
                  <td>57.3 (3.7)</td>
                </tr>
                <tr valign="top">
                  <td>Sensitivity (%)</td>
                  <td>56.4 (6.8)</td>
                  <td>56.5 (6.8)</td>
                  <td>54.8 (5.8)</td>
                </tr>
                <tr valign="top">
                  <td>Specificity (%)</td>
                  <td>60.0 (7.0)</td>
                  <td>60.8 (7.5)</td>
                  <td>59.8 (5.8)</td>
                </tr>
                <tr valign="top">
                  <td>Area under the receiver operating characteristic curve (%)</td>
                  <td>60.7 (5.9)</td>
                  <td>61.1 (5.1)</td>
                  <td>60.2 (4.4)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table4fn1">
                <p><sup>a</sup>There is a 59.3% probability that the performance with the mean augmented features is better than the nonaugmented features.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>Augmentation did not seem to prove useful in overcoming low-quality data and unstable features and seemed to decrease performance. It is possible that sampling from a shorter window exacerbates the instability of the features and that even if one of the windows was more informative than others, that window might not be the same for all recordings. This may essentially introduce more noise into the training data and therefore have an overall negative effect on model performance.</p>
          <p>Augmentation proved beneficial when taking the mean over all segments; however, it was not useful when simply including the additional segments as CV data. This is likely because taking the mean reduces the instability and noise of the features, whereas including all the segments exacerbates the problem and introduces more noise into the entire feature set.</p>
        </sec>
      </sec>
      <sec>
        <title>Final Results: Performance in Participants With No Speech Difficulties</title>
        <p>After developing a decent model to classify PD based on speech, we investigated what it could offer to real-world diagnosis. The raw performance is clearly insufficient to replace neurologists; however, we have shown that the performance bound has not been reached—additional, higher quality data will greatly improve results, along with better and more informative features.</p>
        <p>First, we investigated whether it would be possible to detect symptoms imperceptible to a neurologist. If this is possible, the combination of both could potentially increase the accuracy of diagnosis. To do this, a set of PD participants who had <italic>no speech difficulties</italic> (NSDs) was first removed from the data set before any experimentation (including those mentioned in the previous sections) to prevent overfitting during the model evaluation stage. This relied on a field of the mPower UPDRS survey, which defaulted to zero, which we are aware relies on the honestly/reliability of participants. This created a subset of 81 participants (of the previous 4112) who had PD and NSDs.</p>
        <p>From the HC participants not used in CV/model evaluation stage, 81 participants were chosen such that they exactly matched the gender of each NSD participant and as closely matched the age as possible. We combined the 2 to form a test set of 162 participants and used the FWLS ensemble trained on the CV set to evaluate the test set. No data augmentation was performed. This is presented in <xref ref-type="table" rid="table5">Table 5</xref>. Surprisingly, there was an increase in sensitivity between diagnosis of participants with perceptible dysphonia (as indicated by participants having speech difficulties) compared with the diagnosis of those with imperceptible dysphonia (as indicated by participants having NSDs). This implies that there must exist some features that capture information regarding the disease state of a person but does not relate to audible dysphonia.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Performance of the feature-weighted linear stacking ensemble on participants with no audible symptoms and previously unseen data.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="380"/>
            <col width="220"/>
            <col width="190"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td>Performance measures</td>
                <td>Cross-validation mean</td>
                <td>Cross-validation SD</td>
                <td>No speech difficulty</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy (%)</td>
                <td>59.2</td>
                <td>5.3</td>
                <td>59.3</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity (%)</td>
                <td>57.4</td>
                <td>7.6</td>
                <td>63.0</td>
              </tr>
              <tr valign="top">
                <td>Specificity (%)</td>
                <td>61.1</td>
                <td>7.4</td>
                <td>55.6</td>
              </tr>
              <tr valign="top">
                <td>Area under the receiver operating characteristic curve (%)</td>
                <td>62.3</td>
                <td>5.9</td>
                <td>66.7</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>We hypothesized that this is possible because of the more abstract features, which are not related to audible symptoms. To investigate, for each feature, we checked two matters: first, whether the distribution over NSD and PD was similar (ie, captured information about disease state), and second, whether the distribution between NSD and control was different (ie, did not relate to audible dysphonia), implying that the feature is likely discriminative yet inaudible.</p>
        <p>To perform significance testing, we first employed a normality test on all features across all groups. If a single feature was normal across all groups (ie, PD, NSD, and HC), then we employed a one-way analysis of variance (ANOVA) to test for significant differences, followed by a Tukey honestly significant difference post hoc. Groups were considered to be sampled from different distributions of a <italic>P</italic> value of .05. If that feature was not normal across all groups, then a Kruskal-Wallis ANOVA was used, followed by a Dunn-Bonferroni posthoc test. Similarly, a value of <italic>P</italic>=.04 is required to say that the feature was sampled from different distributions. Note that because we are only interested in 2 posthoc comparisons (between NSD-PD and NSD-HC), the posthoc tests overcorrected the <italic>P</italic> values. This meant that we can be more confident in any significant difference detected.</p>
        <p>We expected that abstract features such as those that try to capture complexity (eg, sample entropy) were likely to be inaudible. These were not biologically motivated and more sensitive to high-frequency information to which the human auditory system was not. This was confirmed in <xref rid="figure3" ref-type="fig">Figure 3</xref>, where a significant difference was detected for mean log energy between the NSD and control groups, yet no significant difference was detected between the NSD and PD groups, for males only.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Violin plot of mean_Log energy for males (blue) and females (orange). For males, a significant difference was detected between the no speech difficulty and control groups (<italic>P</italic>&lt;.00002), but not between the no speech difficulty and Parkinson disease groups (<italic>P</italic>=.13). F: female; Log: logarithmic; M: male; NSD: no speech difficulties; PD: Parkinson disease.</p>
          </caption>
          <graphic xlink:href="biomedeng_v5i1e13611_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>In the full results, we found that features such as energy, entropy, and their corresponding coefficients were inaudible, whereas features such as jitter, those derived from fundamental frequency, MFCC, and their corresponding coefficients were audible.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we have shown that features used in prior literature on small data sets do not perform well when extrapolated to more real-world, much larger data sets such as mPower. Owing to natural variation in speech, the separation of healthy individuals and those with PD is not as simple as previously believed. We have presented significant performance improvements with an additional set of features and techniques such as assembling and data augmentation. Importantly, we have demonstrated this in a robust environment that is well guarded against overfitting.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Although performance is currently insufficient to substitute for a clinician’s diagnosis, significant improvements from simple data augmentation, ensemble models, and additional features imply that peak performance has not yet been achieved. The power of ML only increases as more data become available.</p>
        <p>We have also shown that some features used are capable of detecting symptoms of the PD state, yet are <italic>imperceptible to human hearing</italic>. This is a very promising result for the field, with the possibility that a large robust model may eventually outperform humans. For now, these models are a low-cost tool for clinicians to validate their diagnosis; a positive result may be a flag to perform further checks on the patient. This also suggests that vocal phonation features could be used as part of a set of noninvasive biomarkers for PD.</p>
        <p>The biggest barrier to the introduction of ML in the clinical setting is trust. This relies on <italic>either</italic> a strong understanding of the models and features <italic>or</italic> good performance on a substantially sized data set with robust evaluation approaches. We believe that developing a deep understanding of ML in clinicians will become increasingly difficult, as models and features become more complex. Thus, it may be best to focus on providing larger data sets. The mPower data set makes great strides in size and availability, but it lacks data control. The field would benefit greatly from a standardized data set against which the performance of models could be empirically evaluated.</p>
        <p>Many avenues still remain unexplored. The diagnosis of PD often involves testing a patient’s response to medication, such as levodopa. Additional information from phonation samples before and after levodopa consumption may greatly improve performance. We focused only on traditional ML approaches based on signal processing. A notable weakness of feature engineering is information loss, as it is difficult to perfectly describe a signal. Structured neural networks are suitable for making predictions from a raw data stream, such as computer vision and neural networks. In our testing, simple convolutional and recurrent neural networks have achieved similar performance to our best models and greatly improved performance when combined with feature engineering. However, they are more difficult to interpret.</p>
        <p>Further improvements could be seen in multidimensional data sets using data from more than one source (eg, postural sway, gait, and finger tapping, all of which could be measured on smartphone devices). Measuring these during clinical visits in a controlled setting under standardized conditions would produce substantially cleaner data at minimal cost, but it is essential to have the cooperation of the clinical and patient communities. Our research provides a first step in establishing the great value these tools could provide, not just in PD.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ANOVA</term>
          <def>
            <p>analysis of variance</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CV</term>
          <def>
            <p>cross-validation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EEG</term>
          <def>
            <p>electroencephalogram</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">FWLS</term>
          <def>
            <p>feature-weighted linear stacking</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">GQ</term>
          <def>
            <p>Glottal Quotient</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">HC</term>
          <def>
            <p>healthy control</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HNR</term>
          <def>
            <p>harmonics-to-noise ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MFCC</term>
          <def>
            <p>Mel-frequency cepstral coefficient</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">NSD</term>
          <def>
            <p>no speech difficulty</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">PD</term>
          <def>
            <p>Parkinson disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">RBF</term>
          <def>
            <p>radial basis function</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">RPDE</term>
          <def>
            <p>recurrence period density entropy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">SVD</term>
          <def>
            <p>singular value decomposition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">UPDRS</term>
          <def>
            <p>Unified Parkinson's Disease Rating Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">VFER</term>
          <def>
            <p>vocal fold excitation ratio</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was supported by the <italic>Australian Government Research Training Program</italic> Scholarship and delivered in partnership with <italic>Our Health in Our Hands</italic>, a strategic initiative of the Australian National University, which aims to transform health care by developing new personalized health technologies and solutions in collaboration with patients, clinicians, and health care providers. The authors would like to thank Alex Smith, Mehika Manocha, and Professor Christian Lueck for their helpful comments and suggestions.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Savitt</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Dawson</surname>
              <given-names>VL</given-names>
            </name>
            <name name-style="western">
              <surname>Dawson</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <article-title>Diagnosis and treatment of Parkinson disease: molecules to medicine</article-title>
          <source>J Clin Invest</source>
          <year>2006</year>
          <month>07</month>
          <volume>116</volume>
          <issue>7</issue>
          <fpage>1744</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1172/JCI29178"/>
          </comment>
          <pub-id pub-id-type="doi">10.1172/JCI29178</pub-id>
          <pub-id pub-id-type="medline">16823471</pub-id>
          <pub-id pub-id-type="pmcid">PMC1483178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fahn</surname>
              <given-names>S</given-names>
            </name>
            <collab>Parkinson Study Group</collab>
          </person-group>
          <article-title>Does levodopa slow or hasten the rate of progression of Parkinson's disease?</article-title>
          <source>J Neurol</source>
          <year>2005</year>
          <month>10</month>
          <volume>252</volume>
          <issue>Suppl 4</issue>
          <fpage>IV37</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1007/s00415-005-4008-5</pub-id>
          <pub-id pub-id-type="medline">16222436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tolosa</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wenning</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Poewe</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>The diagnosis of Parkinson's disease</article-title>
          <source>Lancet Neurol</source>
          <year>2006</year>
          <month>01</month>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>75</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.1016/S1474-4422(05)70285-4</pub-id>
          <pub-id pub-id-type="medline">16361025</pub-id>
          <pub-id pub-id-type="pii">S1474-4422(05)70285-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thenganatt</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Jankovic</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Parkinson disease subtypes</article-title>
          <source>JAMA Neurol</source>
          <year>2014</year>
          <month>04</month>
          <volume>71</volume>
          <issue>4</issue>
          <fpage>499</fpage>
          <lpage>504</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaneurol.2013.6233</pub-id>
          <pub-id pub-id-type="medline">24514863</pub-id>
          <pub-id pub-id-type="pii">1827554</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Quinn</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Parkinsonism--recognition and differential diagnosis</article-title>
          <source>Br Med J</source>
          <year>1995</year>
          <month>02</month>
          <day>18</day>
          <volume>310</volume>
          <issue>6977</issue>
          <fpage>447</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/7646647"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.310.6977.447</pub-id>
          <pub-id pub-id-type="medline">7646647</pub-id>
          <pub-id pub-id-type="pmcid">PMC2548823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brooks</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>Parkinson's disease: diagnosis</article-title>
          <source>Parkinsonism Relat Disord</source>
          <year>2012</year>
          <month>01</month>
          <volume>18</volume>
          <fpage>S31</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1016/S1353-8020(11)70012-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jankovic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rajput</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Perl</surname>
              <given-names>DP</given-names>
            </name>
          </person-group>
          <article-title>The evolution of diagnosis in early Parkinson disease. Parkinson study group</article-title>
          <source>Arch Neurol</source>
          <year>2000</year>
          <month>03</month>
          <volume>57</volume>
          <issue>3</issue>
          <fpage>369</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1001/archneur.57.3.369</pub-id>
          <pub-id pub-id-type="medline">10714663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scherzer</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Eklund</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Morse</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Locascio</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fefer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schwarzschild</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Schlossmacher</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Hauser</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Vance</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Sudarsky</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Standaert</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Growdon</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>RV</given-names>
            </name>
            <name name-style="western">
              <surname>Gullans</surname>
              <given-names>SR</given-names>
            </name>
          </person-group>
          <article-title>Molecular markers of early Parkinson's disease based on gene expression in blood</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2007</year>
          <month>01</month>
          <day>16</day>
          <volume>104</volume>
          <issue>3</issue>
          <fpage>955</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&amp;pmid=17215369"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.0610204104</pub-id>
          <pub-id pub-id-type="medline">17215369</pub-id>
          <pub-id pub-id-type="pii">0610204104</pub-id>
          <pub-id pub-id-type="pmcid">PMC1766335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Quinn</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Peskind</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Galasko</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jankovic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zabetian</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Leverenz</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Baird</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Montine</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hancock</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bradner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>UJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>DJ-1 and alpha-synuclein in human cerebrospinal fluid as biomarkers of Parkinson's disease</article-title>
          <source>Brain</source>
          <year>2010</year>
          <month>03</month>
          <volume>133</volume>
          <issue>Pt 3</issue>
          <fpage>713</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20157014"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/brain/awq008</pub-id>
          <pub-id pub-id-type="medline">20157014</pub-id>
          <pub-id pub-id-type="pii">awq008</pub-id>
          <pub-id pub-id-type="pmcid">PMC2842513</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mohan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tarolli</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Elson</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Spear</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Glidden</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Terzis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dorsey</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Saria</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using smartphones and machine learning to quantify Parkinson disease severity: the mobile Parkinson disease score</article-title>
          <source>JAMA Neurol</source>
          <year>2018</year>
          <month>07</month>
          <day>1</day>
          <volume>75</volume>
          <issue>7</issue>
          <fpage>876</fpage>
          <lpage>80</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29582075"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamaneurol.2018.0809</pub-id>
          <pub-id pub-id-type="medline">29582075</pub-id>
          <pub-id pub-id-type="pii">2676504</pub-id>
          <pub-id pub-id-type="pmcid">PMC5885192</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Spielman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>LO</given-names>
            </name>
          </person-group>
          <article-title>Novel speech signal processing algorithms for high-accuracy classification of Parkinson's disease</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2012</year>
          <month>05</month>
          <volume>59</volume>
          <issue>5</issue>
          <fpage>1264</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1109/TBME.2012.2183367</pub-id>
          <pub-id pub-id-type="medline">22249592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bot</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Suver</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Neto</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Kellen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bare</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Doerr</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pratap</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wilbanks</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dorsey</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Friend</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Trister</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>The mPower study, Parkinson disease mobile data collected using ResearchKit</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>03</month>
          <day>3</day>
          <volume>3</volume>
          <fpage>160011</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26938265"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.11</pub-id>
          <pub-id pub-id-type="medline">26938265</pub-id>
          <pub-id pub-id-type="pii">sdata201611</pub-id>
          <pub-id pub-id-type="pmcid">PMC4776701</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rusz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cmejla</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tykalova</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ruzickova</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Klempir</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Majerova</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Picmausova</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ruzicka</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Imprecise vowel articulation as a potential early marker of Parkinson's disease: effect of speaking task</article-title>
          <source>J Acoust Soc Am</source>
          <year>2013</year>
          <month>09</month>
          <volume>134</volume>
          <issue>3</issue>
          <fpage>2171</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1121/1.4816541</pub-id>
          <pub-id pub-id-type="medline">23967947</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Spielman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Suitability of dysphonia measurements for telemonitoring of Parkinson's disease</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2009</year>
          <month>04</month>
          <volume>56</volume>
          <issue>4</issue>
          <fpage>1015</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21399744"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/TBME.2008.2005954</pub-id>
          <pub-id pub-id-type="medline">21399744</pub-id>
          <pub-id pub-id-type="pmcid">PMC3051371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hazan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hilu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Manevitz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Sapir</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Early Diagnosis of Parkinson's Disease via Machine Learning on Speech Data</article-title>
          <source>27th Convention of Electrical and Electronics Engineers in Israel</source>
          <year>2012</year>
          <conf-name>EEEI'12</conf-name>
          <conf-date>November 14-17,  2012</conf-date>
          <conf-loc>Eilat, Israel</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/6377065"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/eeei.2012.6377065</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Penny</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rezek</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Temporal and spatial complexity measures for electroencephalogram based brain-computer interfacing</article-title>
          <source>Med Biol Eng Comput</source>
          <year>1999</year>
          <month>01</month>
          <volume>37</volume>
          <issue>1</issue>
          <fpage>93</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1007/BF02513272</pub-id>
          <pub-id pub-id-type="medline">10396848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>ICASSP 90. 1990 International Conference on Acoustics, Speech and Signal Processing</article-title>
          <source>Proceedings of the International Conference on Acoustics, Speech, and Signal Processing</source>
          <year>1990</year>
          <conf-name>ICASSP'90</conf-name>
          <conf-date>April 3-6, 1990</conf-date>
          <conf-loc>Albuquerque, NM</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/115702"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/icassp.1990.115547</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Horii</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Jitter and shimmer differences among sustained vowel phonations</article-title>
          <source>J Speech Hear Res</source>
          <year>1982</year>
          <month>03</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>12</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1044/jshr.2501.12</pub-id>
          <pub-id pub-id-type="medline">7087413</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zañartu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Robust fundamental frequency estimation in sustained vowels: detailed algorithmic comparisons and information fusion with adaptive Kalman filtering</article-title>
          <source>J Acoust Soc Am</source>
          <year>2014</year>
          <month>05</month>
          <volume>135</volume>
          <issue>5</issue>
          <fpage>2885</fpage>
          <lpage>901</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24815269"/>
          </comment>
          <pub-id pub-id-type="doi">10.1121/1.4870484</pub-id>
          <pub-id pub-id-type="medline">24815269</pub-id>
          <pub-id pub-id-type="pmcid">PMC4032429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yumoto</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gould</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Baer</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Harmonics-to-noise ratio as an index of the degree of hoarseness</article-title>
          <source>J Acoust Soc Am</source>
          <year>1982</year>
          <month>06</month>
          <volume>71</volume>
          <issue>6</issue>
          <fpage>1544</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1121/1.387808</pub-id>
          <pub-id pub-id-type="medline">7108029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Michaelis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gramss</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Strube</surname>
              <given-names>HW</given-names>
            </name>
          </person-group>
          <article-title>Glottal to-noise excitation ratio - a new measure for describing pathological voices</article-title>
          <source>Acta Acustica United with Acustica</source>
          <year>1997</year>
          <volume>83</volume>
          <issue>4</issue>
          <fpage>700</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pdfs.semanticscholar.org/0457/dd95c33bdc38f5c0e7a96059a3fd556e4e6c.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>LO</given-names>
            </name>
          </person-group>
          <article-title>Nonlinear speech analysis algorithms mapped to a standard metric achieve clinically useful quantification of average Parkinson's disease symptom severity</article-title>
          <source>J R Soc Interface</source>
          <year>2011</year>
          <month>06</month>
          <day>6</day>
          <volume>8</volume>
          <issue>59</issue>
          <fpage>842</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21084338"/>
          </comment>
          <pub-id pub-id-type="doi">10.1098/rsif.2010.0456</pub-id>
          <pub-id pub-id-type="medline">21084338</pub-id>
          <pub-id pub-id-type="pii">rsif.2010.0456</pub-id>
          <pub-id pub-id-type="pmcid">PMC3104343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kounoudes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Naylor</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Brookes</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The DYPSA Algorithm for Estimation of Glottal Closure Instants in Voiced Speech</article-title>
          <source>International Conference on Acoustics, Speech, and Signal Processing</source>
          <year>2002</year>
          <conf-name>ICASSP'02</conf-name>
          <conf-date>May 7-11, 2002</conf-date>
          <conf-loc>Orlando, FL</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/5743726"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/icassp.2002.1005748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Costello</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Moroz</surname>
              <given-names>IM</given-names>
            </name>
          </person-group>
          <article-title>Exploiting nonlinear recurrence and fractal scaling properties for voice disorder detection</article-title>
          <source>Biomed Eng Online</source>
          <year>2007</year>
          <month>06</month>
          <day>26</day>
          <volume>6</volume>
          <fpage>23</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://biomedical-engineering-online.biomedcentral.com/articles/10.1186/1475-925X-6-23"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1475-925X-6-23</pub-id>
          <pub-id pub-id-type="medline">17594480</pub-id>
          <pub-id pub-id-type="pii">1475-925X-6-23</pub-id>
          <pub-id pub-id-type="pmcid">PMC1913514</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hegger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kantz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Matassini</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Denoising human speech signals using chaoslike features</article-title>
          <source>Phys Rev Lett</source>
          <year>2000</year>
          <month>04</month>
          <day>3</day>
          <volume>84</volume>
          <issue>14</issue>
          <fpage>3197</fpage>
          <lpage>200</lpage>
          <pub-id pub-id-type="doi">10.1103/PhysRevLett.84.3197</pub-id>
          <pub-id pub-id-type="medline">11019046</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenstein</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>de Luca</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>A practical method for calculating largest Lyapunov exponents from small data sets</article-title>
          <source>Physica D</source>
          <year>1993</year>
          <month>05</month>
          <volume>65</volume>
          <issue>1-2</issue>
          <fpage>117</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1016/0167-2789(93)90009-P</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mandelbrot</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>How long is the coast of Britain? Statistical self-similarity and fractional dimension</article-title>
          <source>Science</source>
          <year>1967</year>
          <month>05</month>
          <day>5</day>
          <volume>156</volume>
          <issue>3775</issue>
          <fpage>636</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1126/science.156.3775.636</pub-id>
          <pub-id pub-id-type="medline">17837158</pub-id>
          <pub-id pub-id-type="pii">156/3775/636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doyle</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Dugan</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Humphries</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Newton</surname>
              <given-names>RU</given-names>
            </name>
          </person-group>
          <article-title>Discriminating between elderly and young using a fractal dimension analysis of centre of pressure</article-title>
          <source>Int J Med Sci</source>
          <year>2004</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>11</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.medsci.org/v01p0011.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.7150/ijms.1.11</pub-id>
          <pub-id pub-id-type="medline">15912186</pub-id>
          <pub-id pub-id-type="pmcid">PMC1074506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schmit</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Dalvi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sahay</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shear</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Shockley</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Pun</surname>
              <given-names>RY</given-names>
            </name>
          </person-group>
          <article-title>Deterministic center of pressure patterns characterize postural instability in Parkinson's disease</article-title>
          <source>Exp Brain Res</source>
          <year>2006</year>
          <month>01</month>
          <volume>168</volume>
          <issue>3</issue>
          <fpage>357</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1007/s00221-005-0094-y</pub-id>
          <pub-id pub-id-type="medline">16047175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Richman</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Moorman</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Physiological time-series analysis using approximate entropy and sample entropy</article-title>
          <source>Am J Physiol Heart Circ Physiol</source>
          <year>2000</year>
          <month>06</month>
          <volume>278</volume>
          <issue>6</issue>
          <fpage>H2039</fpage>
          <lpage>49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://journals.physiology.org/doi/full/10.1152/ajpheart.2000.278.6.H2039?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1152/ajpheart.2000.278.6.H2039</pub-id>
          <pub-id pub-id-type="medline">10843903</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Costa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberger</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Multiscale entropy analysis of biological signals</article-title>
          <source>Phys Rev E Stat Nonlin Soft Matter Phys</source>
          <year>2005</year>
          <month>02</month>
          <volume>71</volume>
          <issue>2 Pt 1</issue>
          <fpage>021906</fpage>
          <pub-id pub-id-type="doi">10.1103/PhysRevE.71.021906</pub-id>
          <pub-id pub-id-type="medline">15783351</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eyben</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wöllmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schuller</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>OpenSmile: The Munich Versatile and Fast Open-Source Audio Feature Extractor</article-title>
          <source>Proceedings of the 18th ACM international conference on Multimedia</source>
          <year>2010</year>
          <conf-name>ACM'10</conf-name>
          <conf-date>October 25-29, 2010</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/1873951.1874246"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/1873951.1874246</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geissmann</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Python Package for Sleep Scoring From EEG Data</article-title>
          <source>GitHub</source>
          <year>2017</year>
          <access-date>2017-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/gilestrolab/pyrem">https://github.com/gilestrolab/pyrem</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scholzel</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Nonlinear Measures for Dynamical Systems (NoLDS)</article-title>
          <source>GitHub</source>
          <access-date>2017-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/CSchoel/nolds">https://github.com/CSchoel/nolds</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Phase Space Reconstruction: PyPSR</article-title>
          <source>GitHub</source>
          <year>2017</year>
          <access-date>2017-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/hsharrison/pypsr">https://github.com/hsharrison/pypsr</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Accurate Telemonitoring of Parkinson’s Disease Symptom Severity Using Nonlinear Speech Signal Processing and Statistical Machine Learning</article-title>
          <source>Oxford University Research Archive: ORA</source>
          <year>2012</year>
          <access-date>2020-06-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ora.ox.ac.uk/objects/uuid:2a43b92a-9cd5-4646-8f0f-81dbe2ba9d74">https://ora.ox.ac.uk/objects/uuid:2a43b92a-9cd5-4646-8f0f-81dbe2ba9d74</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kanters</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chon</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Automatic selection of the threshold value R for approximate entropy</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2008</year>
          <month>08</month>
          <volume>55</volume>
          <issue>8</issue>
          <fpage>1966</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1109/TBME.2008.919870</pub-id>
          <pub-id pub-id-type="medline">18632359</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Plastino</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Fisher information and nonlinear dynamics</article-title>
          <source>Physica A</source>
          <year>2001</year>
          <volume>291</volume>
          <issue>1</issue>
          <fpage>523</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S0378437100005318"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0378-4371(00)00531-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benavoli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Corani</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Demsar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zaffalon</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Time for a change: a tutorial for comparing multiple classifiers through Bayesian analysis</article-title>
          <source>arXivc</source>
          <year>2016</year>
          <month>06</month>
          <day>14</day>
          <comment>epub ahead of print - 1606.04316<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1606.04316"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Papeş</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Soberón</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Rethinking receiver operating characteristic analysis applications in ecological niche modeling</article-title>
          <source>Ecol Model</source>
          <year>2008</year>
          <volume>213</volume>
          <issue>1</issue>
          <fpage>63</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ideas.repec.org/a/eee/ecomod/v213y2008i1p63-72.html"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ecolmodel.2007.11.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neto</surname>
              <given-names>E C</given-names>
            </name>
            <name name-style="western">
              <surname>Perumal</surname>
              <given-names>T M</given-names>
            </name>
            <name name-style="western">
              <surname>Pratap</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bot</surname>
              <given-names>B M</given-names>
            </name>
            <name name-style="western">
              <surname>Mangravite</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Omberg</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>On the analysis of personalized medication response and classification of case vs control patients in mobile health studies: the mPower case study</article-title>
          <source>Arxiv</source>
          <year>2017</year>
          <comment>epub ahead of print<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1706.09574"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Camacho</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>JG</given-names>
            </name>
          </person-group>
          <article-title>SWIPE: a sawtooth waveform inspired pitch estimator for speech and music</article-title>
          <source>J Acoust Soc Am</source>
          <year>2008</year>
          <month>09</month>
          <volume>124</volume>
          <issue>3</issue>
          <fpage>1638</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1121/1.2951592</pub-id>
          <pub-id pub-id-type="medline">19045655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sill</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Takacs</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>MacKey</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Feature-weighted linear stacking</article-title>
          <source>Arxiv</source>
          <year>2009</year>
          <fpage>-</fpage>
          <comment>epub ahead of print(0911.0460)<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/0911.0460"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koren</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The BellKor Solution to the Netflix Grand Prize</article-title>
          <source>The Netflix Prize</source>
          <year>2009</year>
          <access-date>2020-06-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.netflixprize.com/assets/GrandPrize2009_BPC_BellKor.pdf">https://www.netflixprize.com/assets/GrandPrize2009_BPC_BellKor.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
