<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i10e26305</article-id>
      <article-id pub-id-type="pmid">34665148</article-id>
      <article-id pub-id-type="doi">10.2196/26305</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Detecting Parkinson Disease Using a Web-Based Speech Task: Observational Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Kukafka</surname>
            <given-names>Rita</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Goni</surname>
            <given-names>Maria</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Fincham</surname>
            <given-names>Colin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhai</surname>
            <given-names>Dh</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Rahman</surname>
            <given-names>Wasifur</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Computer Science</institution>
            <institution>University of Rochester</institution>
            <addr-line>250 Hutchinson Rd</addr-line>
            <addr-line>Rochester, NY, 14620</addr-line>
            <country>United States</country>
            <phone>1 5857487677</phone>
            <email>echowdh2@ur.rochester.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9736-442X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Sangwu</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3930-3079</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Islam</surname>
            <given-names>Md Saiful</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3725-3493</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Antony</surname>
            <given-names>Victor Nikhil</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4722-2041</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Ratnu</surname>
            <given-names>Harshil</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4791-1867</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Ali</surname>
            <given-names>Mohammad Rafayet</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7878-7910</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Mamun</surname>
            <given-names>Abdullah Al</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8757-9948</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Wagner</surname>
            <given-names>Ellen</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7388-8504</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Jensen-Roberts</surname>
            <given-names>Stella</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7269-3502</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Waddell</surname>
            <given-names>Emma</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8863-0335</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Myers</surname>
            <given-names>Taylor</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8223-2483</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Pawlik</surname>
            <given-names>Meghan</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9025-0382</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Soto</surname>
            <given-names>Julia</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7885-862X</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author">
          <name name-style="western">
            <surname>Coffey</surname>
            <given-names>Madeleine</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9939-4414</ext-link>
        </contrib>
        <contrib id="contrib15" contrib-type="author">
          <name name-style="western">
            <surname>Sarkar</surname>
            <given-names>Aayush</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3603-1533</ext-link>
        </contrib>
        <contrib id="contrib16" contrib-type="author">
          <name name-style="western">
            <surname>Schneider</surname>
            <given-names>Ruth</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8094-4041</ext-link>
        </contrib>
        <contrib id="contrib17" contrib-type="author">
          <name name-style="western">
            <surname>Tarolli</surname>
            <given-names>Christopher</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0422-4020</ext-link>
        </contrib>
        <contrib id="contrib18" contrib-type="author">
          <name name-style="western">
            <surname>Lizarraga</surname>
            <given-names>Karlo</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9766-6252</ext-link>
        </contrib>
        <contrib id="contrib19" contrib-type="author">
          <name name-style="western">
            <surname>Adams</surname>
            <given-names>Jamie</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1170-6688</ext-link>
        </contrib>
        <contrib id="contrib20" contrib-type="author">
          <name name-style="western">
            <surname>Little</surname>
            <given-names>Max A</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1507-3822</ext-link>
        </contrib>
        <contrib id="contrib21" contrib-type="author">
          <name name-style="western">
            <surname>Dorsey</surname>
            <given-names>E Ray</given-names>
          </name>
          <degrees>MBA, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5140-1248</ext-link>
        </contrib>
        <contrib id="contrib22" contrib-type="author">
          <name name-style="western">
            <surname>Hoque</surname>
            <given-names>Ehsan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4781-4733</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science</institution>
        <institution>University of Rochester</institution>
        <addr-line>Rochester, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Center for Health and Technology</institution>
        <institution>University of Rochester Medical Center</institution>
        <addr-line>Rochester, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Neurology</institution>
        <institution>University of Rochester Medical Center</institution>
        <addr-line>Rochester, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of Computer Science</institution>
        <institution>University of Birmingham</institution>
        <addr-line>Birmingham</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>MIT Media Lab</institution>
        <institution>Massachusetts Institute of Technology</institution>
        <addr-line>Cambridge, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Wasifur Rahman <email>echowdh2@ur.rochester.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>10</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>19</day>
        <month>10</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>10</issue>
      <elocation-id>e26305</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>2</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>3</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>13</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>7</day>
          <month>8</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Wasifur Rahman, Sangwu Lee, Md Saiful Islam, Victor Nikhil Antony, Harshil Ratnu, Mohammad Rafayet Ali, Abdullah Al Mamun, Ellen Wagner, Stella Jensen-Roberts, Emma Waddell, Taylor Myers, Meghan Pawlik, Julia Soto, Madeleine Coffey, Aayush Sarkar, Ruth Schneider, Christopher Tarolli, Karlo Lizarraga, Jamie Adams, Max A Little, E Ray Dorsey, Ehsan Hoque. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 19.10.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/10/e26305" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Access to neurological care for Parkinson disease (PD) is a rare privilege for millions of people worldwide, especially in resource-limited countries. In 2013, there were just 1200 neurologists in India for a population of 1.3 billion people; in Africa, the average population per neurologist exceeds 3.3 million people. In contrast, 60,000 people receive a diagnosis of PD every year in the United States alone, and similar patterns of rising PD cases—fueled mostly by environmental pollution and an aging population—can be seen worldwide. The current projection of more than 12 million patients with PD worldwide by 2040 is only part of the picture given that more than 20% of patients with PD remain undiagnosed. Timely diagnosis and frequent assessment are key to ensure timely and appropriate medical intervention, thus improving the quality of life of patients with PD.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In this paper, we propose a web-based framework that can help anyone anywhere around the world record a short speech task and analyze the recorded data to screen for PD.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We collected data from 726 unique participants (PD: 262/726, 36.1% were women; non-PD: 464/726, 63.9% were women; average age 61 years) from all over the United States and beyond. A small portion of the data (approximately 54/726, 7.4%) was collected in a laboratory setting to compare the performance of the models trained with noisy home environment data against high-quality laboratory-environment data. The participants were instructed to utter a popular pangram containing all the letters in the English alphabet, “the quick brown fox jumps over the lazy dog.” We extracted both standard acoustic features (mel-frequency cepstral coefficients and jitter and shimmer variants) and deep learning–based embedding features from the speech data. Using these features, we trained several machine learning algorithms. We also applied model interpretation techniques such as Shapley additive explanations to ascertain the importance of each feature in determining the model’s output.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We achieved an area under the curve of 0.753 for determining the presence of self-reported PD by modeling the standard acoustic features through the XGBoost—a gradient-boosted decision tree model. Further analysis revealed that the widely used mel-frequency cepstral coefficient features and a subset of previously validated dysphonia features designed for detecting PD from a verbal phonation task (pronouncing “ahh”) influence the model’s decision the most.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our model performed equally well on data collected in a controlled laboratory environment and <italic>in the wild</italic> across different gender and age groups. Using this tool, we can collect data from almost anyone anywhere with an audio-enabled device and help the participants screen for PD remotely, contributing to equity and access in neurological care.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>Parkinson’s disease</kwd>
        <kwd>speech analysis</kwd>
        <kwd>improving access and equity in health care</kwd>
        <kwd>mobile phone</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Parkinson disease (PD) is the fastest-growing neurological disease worldwide. Unfortunately, an estimated 20% of patients with PD remain undiagnosed. This can be largely attributed to the shortage of neurologists worldwide [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>] and limited access to health care. Early diagnosis and continuous monitoring, which allows medication dosage adjustment, are key to managing the symptoms of this incurable disease. The current standard of diagnosis requires in-person clinic visits where an expert assesses the disease symptoms while observing the patients as they perform tasks from the Movement Disorder Society-Unified Parkinson’s Disease Rating Scale (MDS-UPDRS) [<xref ref-type="bibr" rid="ref3">3</xref>]. The MDS-UPDRS includes 24 motor-related tasks to assess speech, facial expression, limb movements, walking, memory, and cognitive abilities. Although many studies have shown success by analyzing hand movements [<xref ref-type="bibr" rid="ref4">4</xref>], limb movement patterns [<xref ref-type="bibr" rid="ref5">5</xref>], and facial expressions [<xref ref-type="bibr" rid="ref6">6</xref>], speech is especially important because approximately 90% of patients with PD exhibit vocal impairment [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>], which is often one of the earliest indicators of PD [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>For speech analysis, researchers have looked into phonations (pronouncing “ahhh”) from audio recordings [<xref ref-type="bibr" rid="ref10">10</xref>] to quantify rhythm, stress, and intonation [<xref ref-type="bibr" rid="ref11">11</xref>]. Little et al [<xref ref-type="bibr" rid="ref12">12</xref>] introduced pitch period entropy (PPE) as a measure of dysphonia to distinguish healthy people from people with PD with 91% accuracy. Later, Tsanas [<xref ref-type="bibr" rid="ref13">13</xref>] expanded on this by calculating 132 dysphonia measures to classify PD versus control with almost 99% accuracy. In addition, Peker et al [<xref ref-type="bibr" rid="ref14">14</xref>] used a novel feature selection technique with a complex-valued artificial neural network. Rueda and Krishnan [<xref ref-type="bibr" rid="ref15">15</xref>] identified a set of mel-frequency cepstral coefficients (MFCCs) and intrinsic mode functions to represent the characteristics of PD. In the domain of analyzing real-life audio data, Wroge et al [<xref ref-type="bibr" rid="ref16">16</xref>] analyzed verbal phonation data collected from smartphones; Vaiciukynas et al [<xref ref-type="bibr" rid="ref17">17</xref>] used a convolutional neural network to detect PD from speech; Vásquez-Correa et al [<xref ref-type="bibr" rid="ref18">18</xref>] collected speech samples with a handheld device in uncontrolled noise conditions; and Dubey et al [<xref ref-type="bibr" rid="ref19">19</xref>] designed a smartwatch-based voice and speech monitoring system for people with PD receiving speech therapies from speech-language pathologists. Although the current state-of-the-art method has shown promising results, it has limitations such as small sample size [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>], oversampling from the same participants [<xref ref-type="bibr" rid="ref14">14</xref>], noise-controlled data collection [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], and age discrepancy between PD and control [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      <p>In this paper, we present our analysis of 726 audio recordings of speech from 36.1% (262/726) individuals with PD and 63.9% (464/726) without PD. The speech recordings were collected using a web-based tool called <italic>Parkinson’s Analysis with Remote Kinetic-tasks</italic> (PARK) [<xref ref-type="bibr" rid="ref22">22</xref>]. The PARK tool instructed the participants to utter a popular pangram containing all the letters in the English alphabet, “The quick brown fox jumps over the lazy dog,” and recorded it. This allowed us to rapidly collect a data set that is more likely to contain real-world variability associated with geographical boundaries, socioeconomic status, age groups, and a wide variety of heterogeneous recording devices. The findings in this study build on this unique real-world data set; thus, we believe it could potentially be generalized for real-world deployments.</p>
      <p>Collecting audio data from individuals often requires in-person visits to the clinic, limiting the number of data points and the diversity within the data. Recent advancements have allowed the collection of tremor data from wearable sensors [<xref ref-type="bibr" rid="ref23">23</xref>] and sleep data from radio frequency signals [<xref ref-type="bibr" rid="ref24">24</xref>]. The existing work with speech and audio analysis uses sophisticated equipment for collecting data that are often noise-free [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref25">25</xref>] and do not contain real-world variability. As a significant portion of the population has access to a mobile device with recording capability (eg, 81% of Americans own a smartphone) [<xref ref-type="bibr" rid="ref26">26</xref>], we opted to use a framework that allows participants to record data from their homes. From the recorded audio files, we extracted acoustic features including MFCCs, which represent the short-term power spectrum of a sound, jitter or shimmer variants (representing pathological voice quality), pitch-related features, spectral power, and dysphonia-related features designed to capture PD-induced vocal impairment [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>In addition, we extracted features from a deep-learning–based encoder—problem agnostic speech encoder (PASE) [<xref ref-type="bibr" rid="ref27">27</xref>], which represents the information contained in a raw audio instance through a list of encoded vectors. These features are modeled with four different machine learning models—support vector machine (SVM), random forest, LightGBM, and XGBoost—to classify individuals with and without PD.</p>
      <p><xref rid="figure1" ref-type="fig">Figure 1</xref> provides an outline of the data analysis system. Our contributions can be summarized as follows:</p>
      <list list-type="bullet">
        <list-item>
          <p>We report findings from one of the largest data sets with real-world variability, containing 726 unique participants mostly from their homes.</p>
        </list-item>
        <list-item>
          <p>We analyzed the audio features of speech to predict PD versus non-PD with an area under the curve (AUC) score of 0.753.</p>
        </list-item>
        <list-item>
          <p>We provide evidence that our model prioritizes MFCC features and a subset of dysphonia features [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref28">28</xref>], which is consistent with previous literature.</p>
        </list-item>
        <list-item>
          <p>Our model performs consistently well when tested on gender- and age-stratified data collected in a controlled laboratory environment and in the wild.</p>
        </list-item>
      </list>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>An outline of our approach for solving the speech task of uttering “The quick brown fox...”.</p>
        </caption>
        <graphic xlink:href="jmir_v23i10e26305_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Recruitment and Data Collection</title>
        <p>We collected data from 726 <italic>unique</italic> participants uttering the sentences, “The quick brown fox jumps over the lazy dog. The dog wakes up and follows the fox into the forest, but again the quick brown fox jumps over the lazy dog,” using PARK [<xref ref-type="bibr" rid="ref29">29</xref>] website. <xref rid="figure2" ref-type="fig">Figure 2</xref> provides a brief overview of the data collection, storage, transfer, and analysis mechanisms. The users are recorded via a webcam and a microphone connected to the PC or laptop, and the recordings are uploaded to a server. <xref rid="figure3" ref-type="fig">Figure 3</xref> shows images of some of the study participants, and <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the age distribution of the participants. The number of participants without PD is 1.8 times the number of participants with PD. Most of the participants with PD are concentrated in the age range of 40 to 80 years. However, participants without PD outnumber those with PD in the age group 20 to 40 years. Similarly, participants with PD significantly outnumber those without PD in the age group of 80 to 90 years. <xref ref-type="table" rid="table1">Table 1</xref> provides the demographic information of the study participants.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>An overview of our data collection, storage, and analysis pipeline.</p>
          </caption>
          <graphic xlink:href="jmir_v23i10e26305_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Some screenshots of our subjects while providing the data. All the subjects except B provided data without any supervision. B, D, E, and F have been diagnosed with Parkinson disease. Electronic informed consent was taken from the participants to use their photos for publication.</p>
          </caption>
          <graphic xlink:href="jmir_v23i10e26305_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>A bar plot showing the age distribution of participants with PD and those without PD in our data set. PD: Parkinson disease.</p>
          </caption>
          <graphic xlink:href="jmir_v23i10e26305_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Demographic composition of our data set (N=726).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="300"/>
            <col width="370"/>
            <col width="300"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Characteristics</td>
                <td>Participants with PD<sup>a</sup></td>
                <td>Participants without PD</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Total, n (%)</td>
                <td>262 (36.1)</td>
                <td>464 (63.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Gender, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>101 (38.5)</td>
                <td>300 (64.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>161 (61.4)</td>
                <td>164 (22.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD)</td>
                <td>65<italic>.</italic>92 (9<italic>.</italic>2)</td>
                <td>57<italic>.</italic>98 (14<italic>.</italic>2)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Country, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>United States</td>
                <td>199 (75.9)</td>
                <td>419 (90.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>63 (24)</td>
                <td>45 (9.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Years since diagnosed, mean (SD)</td>
                <td>7<italic>.</italic>88 (5<italic>.</italic>41)</td>
                <td>N/A<sup>b</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>PD: Parkinson disease.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Among our 726 unique participants, 262 (36.1%) had received the diagnosis of PD, whereas the others were participants without PD. We obtained contact information of patients with PD from local clinics and various PD support groups. Participants without PD were recruited from Amazon Mechanical Turk. During data collection, informed consent of all participants was obtained in accordance with the protocol agreed upon between the researchers and the institutional review board of the University of Rochester. Among the 726 unique participants, only 54 (7.4%) provided data in the laboratory under the guidance of a study coordinator using the PARK tool; the rest of the 672 (92.6%) participants used the PARK system from their homes to provide data. Having participants perform the tasks at home and in the laboratory allowed us to compare the results across both conditions. No participant appeared in either set, and <italic>all</italic> of our participants used the identical PARK protocol.</p>
        <p>The gender distribution in the data set was skewed, especially for female participants. Among all participants, 55.2% (401/726) were women, and 44.8% (325/726) were men. However, among participants with PD, only 38.5% (101/262) were women, and for participants without PD, 64.6% (300/464) were women. Most of the participants with PD were in the age range of 40 to 80 years, but most of the younger (20-40 years) and older (80-90 years) participants were from the group without PD and the group with PD, respectively.</p>
        <p>As our data were collected through a web-based framework, we do not have the MDS-UPDRS scores for our participants because collecting them requires additional input from doctors. Among all the participants in our PD group, only 3 participants replied in affirmative that they had taken medication 2 hours before taking the test; others replied in the negative. Therefore, we assumed that medication effects were negligible for the purposes of this study.</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>During data collection, participants often took some additional time to start to utter the task sentences and stop the recording once the sentences were uttered. Hence, we had a substantial amount of noisy and irrelevant data at the beginning and end of most data instances (<xref rid="figure1" ref-type="fig">Figure 1</xref>). To remove irrelevant data, we used the Penn Phonetics Lab Forced Aligner Toolkit (P2FA) [<xref ref-type="bibr" rid="ref30">30</xref>]. Given an audio file and transcript, it attempts to predict the time boundaries in which each of the words in the transcript was pronounced. P2FA applies a combination of hidden Markov models [<xref ref-type="bibr" rid="ref31">31</xref>] to predict the most likely sequence of phonemes for a given audio and Gaussian mixture models to combine those phonemes into words and obtain their time boundary using a predefined dictionary [<xref ref-type="bibr" rid="ref32">32</xref>]. From the output of this system, we can obtain the starting time of the first word recognized by the P2FA and the ending time of the last word recognized by the P2FA. We used the audio segments between them for further analysis.</p>
      </sec>
      <sec>
        <title>Acoustic Features Extraction</title>
        <p>We extracted features by combining outputs of multiple sources: Praat features [<xref ref-type="bibr" rid="ref33">33</xref>] obtained through the Parselmouth Python interface [<xref ref-type="bibr" rid="ref34">34</xref>] and the previously used dysphonia features relevant for PD analysis [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. After calculating all the features, we constructed a correlation matrix of the feature values to calculate the degree of correlation between them. Then, we iterated over each pair of features in an unordered fashion, and if the correlation coefficient between them was above 0.9, we dropped one of those features from further analysis [<xref ref-type="bibr" rid="ref37">37</xref>]. <xref ref-type="table" rid="table2">Table 2</xref> contains a short overview of the features used in our analysis; the feature names in italicized text are those used for building the models. We provide a more comprehensive description of the features in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Some of our definitions were adapted from the official Praat documentation [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Names of all the features, code source used for collecting them, and a short description<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="220"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="550"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Feature</td>
                <td colspan="2">Code source</td>
                <td>Short description</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>Pitch</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MedianPitch</italic>
                  <sup>b</sup>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">Median principal frequency</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MeanPitch</italic>
                </td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Mean principal frequency</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>StdDevPitch</italic>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">SD in principal frequency</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Jitter</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MeanJitter</italic>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">Perturbation in principal frequency (mean variation)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MedianJitter</italic>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">Perturbation in principal frequency (median variation)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LocalJitter</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Average absolute difference between consecutive periods, divided by the average period</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>LocalAbsoluteJitter</italic>
                </td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Average absolute difference between consecutive periods measured in seconds</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>RapJitter</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Average absolute difference between a period and the average of it and its two neighbors</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Ppq5Jitter</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">5-point period perturbation quotient</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>DdpJitter</italic>
                </td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Difference of differences of periods of principal frequency</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Shimmer</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MeanShimmer</td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">Amplitude perturbation (using mean)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MedianShimmer</italic>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">Amplitude perturbation (using median)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LocalShimmer</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Average absolute difference between amplitudes of consecutive period</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LocaldbShimmer</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Average absolute base-10 logarithm of the difference between amplitudes of consecutive period</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Apq3Shimmer</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">3-point amplitude perturbation quotient</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Apq5Shimmer</td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">5-point amplitude perturbation quotient</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Apq11Shimmer</italic>
                </td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">11-point amplitude perturbation quotient</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>DdaShimmer</italic>
                </td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td colspan="2">Shimmer calculated by difference in differences of amplitude</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>MFCC<sup>c</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>MeanMFCC (0-12)</italic>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">13 features of mean MFCC</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>VariationMFCC (0-12)</italic>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td colspan="2">13 features of mean variation of MFCC</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>RelBandPower (0-3)</italic>
                </td>
                <td colspan="2">Tsanas et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td colspan="2">4 features capturing relative band power in 4 spectrum ranges</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <italic>HNR</italic>
                  <sup>d</sup>
                </td>
                <td colspan="2">Boersma and Weenink [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>Signal-to-noise ratio</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <italic>RPDE</italic>
                  <sup>e</sup>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Pitch estimation uncertainty</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <italic>DFA</italic>
                  <sup>f</sup>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Measure of stochastic self-similarity in turbulent noise</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <italic>PPE</italic>
                  <sup>g</sup>
                </td>
                <td colspan="2">Little et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Measure of inability of maintaining constant pitch</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>We collected the features using the code or methodology described in the corresponding code-source entry.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>The correlated features were removed, and features in italicized text were used to build the models. Feature names are preceded by the loosely defined umbrella category they belong to.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>MFCC: mel-frequency cepstral coefficient.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>HNR: harmonic-to-noise ratio.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>RPDE: recurrence period density entropy.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>DFA: detrended fluctuation analysis.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>PPE: pitch period entropy.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Embedding Features Extraction</title>
        <p>We extracted deep learning–based PASE embeddings [<xref ref-type="bibr" rid="ref27">27</xref>] for our audio files. PASE represents the information contained in a raw audio instance through a list of encoded vectors. To ensure that the encoded vectors contain the same information as the input audio file, it decodes various properties of the audio file, including the audio waveform, log power spectrum, MFCCs, four prosody features (interpolated logarithm of the fundamental frequency, voiced or unvoiced probability, zero-crossing rate, and energy), and local InfoMax, from the encoded vectors. The encoded vectors must retain relevant information about the input audio file to decode all these properties successfully.</p>
        <p>As these properties represent the inherent characteristics of the input audio file rather than any task-specific features, they have been used to solve a host of downstream tasks, such as speech classification, speaker recognition, and emotion recognition. Therefore, we also used them for PD detection.</p>
      </sec>
      <sec>
        <title>Experiments</title>
        <p>For each feature set, we applied a standard set of machine learning algorithms, such as SVM [<xref ref-type="bibr" rid="ref40">40</xref>], XGBoost [<xref ref-type="bibr" rid="ref41">41</xref>], LightGBM [<xref ref-type="bibr" rid="ref42">42</xref>], and random forest [<xref ref-type="bibr" rid="ref43">43</xref>], to classify PD versus non-PD. SVM separates the data into several classes while maintaining the maximum possible margin among the classes. A random forest is built as an ensemble of decision trees; each decision tree builds a tree using a subset of features and learns if-else type decision rules to make a prediction. We also used XGBoost and LightGBM, algorithms based on gradient boosting where they build successively better models by refining the models at hand.</p>
        <p>We used a leave-one-out cross-validation training strategy; using this strategy, one sample of data from the data set is left out, and the other n−1 samples are used to create a model and predict the remaining sample. We used metrics such as binary accuracy and AUC to evaluate our model’s performance. AUC is the area under the receiver operating characteristics (ROC) curve. The ROC curve is constructed by calculating the AUC produced by taking the ratio of the true-positive rate and the false-positive rate while varying the decision threshold. AUC has the highest value of 1, which denotes that the two classes can be separated perfectly, whereas an AUC value of 0.5 indicates that the model cannot distinguish between the two classes. Because our data set was imbalanced, AUC is a much better metric for understanding the true performance of our model. To reduce the effects of data imbalance, we used data augmentation techniques such as the synthetic minority oversampling technique [<xref ref-type="bibr" rid="ref44">44</xref>] and SVM synthetic minority oversampling technique [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
      </sec>
      <sec>
        <title>Model Interpretation Technique</title>
        <p>To interpret the models, we used the Shapley additive explanations (SHAP) technique based on the Shapley value. The Shapley value is a game-theoretic concept of distributing the payouts fairly among players [<xref ref-type="bibr" rid="ref46">46</xref>]. In the machine learning context, each individual feature of an instance can be thought of as a player, and the payout is the difference between an instance’s prediction and the average prediction. We choose SHAP for two reasons: (1) it is well suited for explaining the output of any machine learning model, and (2) it is the only feature attribution method that fulfills the mathematical definition of fairness.</p>
        <p>To use SHAP to explain gradient boosting and tree-based models such as XGBoost, Lundberg et al [<xref ref-type="bibr" rid="ref47">47</xref>] introduced methods to provide a polynomial time model to compute optimized explanations. Their method can generate local interpretations—how the features affect one particular prediction of a data instance—and then combine those local interpretations to make global interpretations about features present in the entire data set. By setting up a class of features to condition on, they traverse the tree in the following manner: if we are traversing on a node that was split based on a feature we are conditioning on, we simply follow the decision path; otherwise, the results from the left and right subtrees originating from the current node are computed recursively, and their results are added through a weighted summation strategy, thus computing the SHAP value for the feature in question.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>The data were preprocessed, and both standard acoustic features (eg, pitch, jitter, shimmer, and MFCC) and deep learning–based audio embedding features, representing an audio clip as a feature vector, were extracted; henceforth, we call these <italic>standard features</italic> and <italic>embedding features</italic>. In the rest of the <italic>Results</italic> section, we discuss the results from the models built on the entire data set, interpretations of the best model on the entire data set, and results and interpretation from specialized models on gender-stratified and age-trimmed data sets.</p>
      </sec>
      <sec>
        <title>Detecting PD From the Entire Data Set</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> contains the AUC and accuracy scores of the four machine learning models trained on the <italic>standard features</italic> and <italic>embedding features</italic> separately. Applying XGBoost on the standard features showed the best performance of 0<italic>.</italic>75 AUC and 0<italic>.</italic>74 accuracy. We also noticed that models trained on <italic>standard features</italic> work better than those trained on <italic>embedding features.</italic></p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Performance on the entire data set. The performance of various machine learning algorithms using the standard and embedding features on a data set combining data from both home and laboratory environments<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="140"/>
            <col width="190"/>
            <col width="150"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td>Algorithm</td>
                <td colspan="2">Standard features</td>
                <td colspan="2">Embedding features</td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>AUC<sup>b</sup></td>
                <td>Accuracy</td>
                <td>AUC</td>
                <td>Accuracy</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>SVM<sup>c</sup></td>
                <td>0.751</td>
                <td>0.735</td>
                <td>0.738</td>
                <td>0.692</td>
              </tr>
              <tr valign="top">
                <td>Random forest</td>
                <td>0.745</td>
                <td>0.720</td>
                <td>0.726</td>
                <td>0.708</td>
              </tr>
              <tr valign="top">
                <td>LightGBM</td>
                <td>0.753</td>
                <td>0.720</td>
                <td>0.737</td>
                <td>0.693</td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>
                  <italic>0.750</italic>
                  <sup>d</sup>
                </td>
                <td>
                  <italic>0.741</italic>
                </td>
                <td>0.722</td>
                <td>0.689</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Models using standard features perform better than the models using embedding features in terms of both binary accuracy and area under the curve. Although the performance of the models is almost similar in terms of area under the curve metric, XGBoost outperforms others by considering both the area under the curve and accuracy metrics simultaneously.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>AUC: area under the curve.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>Variable outperforms all others by taking both area under the curve and accuracy into account.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Model Interpretation</title>
        <p>The goal of SHAP is to explain the model’s prediction of any instance as a sum of contributions from its feature values; if a data instance can be thought of as X<sub>i</sub>=[f<sub>1</sub>, f<sub>2</sub>,...f<sub>N</sub>], SHAP will assign a number to each of these f<sub>j</sub> features, denoting the impact of that feature—both the magnitude and direction—on the model’s prediction. Then, all these local explanations are aggregated to create a global interpretation for the entire data set. A global interpretation is presented in the first part of <xref rid="figure5" ref-type="fig">Figure 5</xref>; the top 10 most impactful features, ranked by having the most impact to the least, are presented. To calculate each feature’s impact, all of its SHAP values across all the data instances are gathered, and then the mean of their absolute values is calculated.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Shapley additive explanations analysis of our best performing models on 3 data sets: (A) main model (ie, entire data set), (B) female model (ie, female only), and (C) age-trimmed model (all subjects are older than 50 years).</p>
          </caption>
          <graphic xlink:href="jmir_v23i10e26305_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Features that have an impact on the model’s performance are typically the spectral features: the mean values or the variation of MFCC in each spectrum range. Apart from that, some other complex features such as recurrence period density entropy (RPDE; a measure of uncertainty in F0 estimation), PPE (a measure of inability to maintain a constant F0), and harmonic-to-noise ratio (HNR) also affected the interpretation presented in the first part of <xref rid="figure5" ref-type="fig">Figure 5</xref>.</p>
      </sec>
      <sec>
        <title>Gender- and Age-Stratified Analysis</title>
        <p>The characteristics of a person’s voice are greatly influenced by age and gender. In <xref rid="figure6" ref-type="fig">Figure 6</xref>, we see that men and women display a changing characteristic in their voices as they get older. Female voices have a higher F0 value, but it decreases with age. Males typically have a higher F0 value in their youth, which decreases with age and then increases roughly after the age of 45 years. Therefore, it can produce confounding effects when analyzing PD from audio, where the machine learning model uses audio features to detect PD. To minimize the effect of confounding factors, researchers trained separate models on data from male and female participants [<xref ref-type="bibr" rid="ref28">28</xref>] or analyzed an age-trimmed data set by considering data from participants older than 50 years [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Changes in fundamental frequency F0 of voice as a function of gender and age (collected from Tsanas et al [<xref ref-type="bibr" rid="ref13">13</xref>]).</p>
          </caption>
          <graphic xlink:href="jmir_v23i10e26305_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Building Specialized Models for Each Gender- and Age-Trimmed Analysis</title>
        <p>The performance metrics of the machine learning models trained on the male, female, and age-trimmed data sets are shown in <xref ref-type="table" rid="table4">Table 4</xref>. By comparing the performance with metrics presented in <xref ref-type="table" rid="table3">Table 3</xref>, we can see that the models that used male- or age-trimmed data sets performed at par or better than the models that used the whole data set to train. However, there was a performance drop in the models using the female data set. <xref ref-type="table" rid="table1">Table 1</xref> shows that females are overrepresented in the non-PD group and underrepresented in the PD group, leading to data imbalance and possibly lowering performance for the female-only model.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Gender- and age-stratified models. Three separate data sets were constructed: a male data set with male participants, a female data set with female participants, and age-trimmed data set by excluding the participants younger than 50 years. For each of these data sets, a separate model was constructed, and its performance is reported below (N=726).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="170"/>
            <col width="80"/>
            <col width="110"/>
            <col width="70"/>
            <col width="110"/>
            <col width="0"/>
            <col width="190"/>
            <col width="270"/>
            <thead>
              <tr valign="top">
                <td>Algorithm</td>
                <td colspan="2">Male (n=415)</td>
                <td colspan="3">Female (n=477)</td>
                <td colspan="2">Age-trimmed (male, n=366 and female, n=426)</td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>AUC<sup>a</sup></td>
                <td>Accuracy</td>
                <td>AUC</td>
                <td>Accuracy</td>
                <td colspan="2">AUC</td>
                <td>Accuracy</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>SVM<sup>b</sup></td>
                <td>0.795</td>
                <td>0.717</td>
                <td>0.659</td>
                <td>0.763</td>
                <td colspan="2">0.755</td>
                <td>0.723</td>
              </tr>
              <tr valign="top">
                <td>Random Forest</td>
                <td>0.758</td>
                <td>0.702</td>
                <td>0.699</td>
                <td>0.788</td>
                <td colspan="2">0.739</td>
                <td>0.713</td>
              </tr>
              <tr valign="top">
                <td>LightGBM</td>
                <td>0.725</td>
                <td>0.665</td>
                <td>0.717</td>
                <td>0.768</td>
                <td colspan="2">0.749</td>
                <td>0.712</td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>0.762</td>
                <td>0.717</td>
                <td>0.682</td>
                <td>0.771</td>
                <td colspan="2">0.742</td>
                <td>0.704</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>AUC: area under the curve.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>SVM: support vector machine.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We also analyzed the features that drive the performance of these specialized models through SHAP analysis. The second part of <xref rid="figure5" ref-type="fig">Figure 5</xref> shows the most salient features ranked by their SHAP value and the distribution of the impact of each feature on the model’s decision-making. The most important features are still dominated by the MFCC-related features or complex features such as the HNR, relative band power in different frequency ranges (RelBandPower1, RelBandPower3), RPDE (uncertainty in F0 estimation), perturbation in F0 (DdpJitter), or perturbation in amplitude (Apq11Shimmer). However, one noticeable fact is that three-pitch and jitter-related features—MedianPitch (median principal frequency, StdDevPitch (SD in principal frequency) and MedianJitter (median variation in F0)—also affected the model’s prediction, which was not noticed in the SHAP analysis run on the all-data-model.</p>
        <p>Similarly, we interpreted the salient features of the age-trimmed data set in the third part of <xref rid="figure5" ref-type="fig">Figure 5</xref>. We noticed that the most salient features usually come from the MFCC feature groups, complex features (RPDE, PPE, and HNR), relative band power (RelBandPower1, RelBandPower2, and RelBandPower3), and pitch-related features. In addition, the pitch-related features also drove the prediction of the model.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Limitations</title>
        <p>In all of our experiments, we chose leave-one-out cross-validation to maintain uniform experimental settings between different models, data augmentation, and data set combinations because K-fold cross-validation can show high variance in performance based on how stratified the folds are. However, we acknowledge that our choice introduces the problem of overfitting and increases the computational complexity manifold. Therefore, we could not run extensive hyperparameter tuning to improve the performance of our models. By carefully stratifying the folds and maintaining the same fold settings for comparable experimental settings, K-fold cross-validation may enable us to achieve higher performance with lower computational complexity.</p>
        <p>Moreover, our chosen metrics, accuracy and ROC AUC, can be overly optimistic because of the unbalanced nature of our data set. Metrics such as ROC–Precision-Recall balanced accuracy, and more information about sensitivity and specificity may shed more light on how we are performing in the minority class. In the future, we plan to apply other cross-validation techniques and better metrics to conduct our experiments and report our performance.</p>
      </sec>
      <sec>
        <title>Detecting PD From Regular Conversation</title>
        <p>Some of the most common voice disorders induced by PD are dysphonia (distortion or abnormality of voice), dysarthria (problems with speech articulation), and hypophonia (reduced voice volume). Two speech-related diagnostic tasks are commonly used to detect PD by exploiting the changing vocal pattern caused by these disorders: (1) sustained phonation (the participant is supposed to utter a single vowel for a long time with constant pitch) and (2) running speech (the participant speaks a standard sentence). Little et al [<xref ref-type="bibr" rid="ref12">12</xref>] developed features for detecting dysphonia in patients with PD. Tsanas et al [<xref ref-type="bibr" rid="ref25">25</xref>] focused on the telemonitoring of self-administered sustained vowel phonation task to predict the Unified Parkinson’s Disease Rating Scale rating (on Rating Scales for Parkinson’s Disease 2003), a commonly used indicator for quantifying PD symptoms. These studies trained their models with data captured by sophisticated devices (eg, wearable devices, high-resolution video recorder, and the Intel at-home–testing-device telemonitoring system) that are often not accessible to all and are difficult to scale. The performance of these models can be significantly reduced when classifying data collected in home acoustics. In addition, correctly completing the sustained phonation task requires following a specific set of guidelines, such as completing the task in one breath, which can be difficult for older individuals.</p>
        <p>In contrast, we analyzed the running speech task from the data collected by using a web-based data collection platform that can be accessed by anyone anywhere in the world and requires only an internet-connected device with an integrated camera and microphone. In addition, the running speech task does not require conforming to specific instructions and is more similar to regular conversation; therefore, the model can be potentially augmented to predict PD from a regular conversation—a potential game-changer in PD assessment. In the future, user-consented plug-ins could be developed for apps such as Alexa, Google Home, or Zoom, where audio is transmitted between persons. Anyone who consents to download the plug-in and uses it while on the phone, over Zoom, or giving virtual or in-person presentations could benefit from receiving an informal referral to see a neurologist, when appropriate. The plug-in would not store the participants’ data unless they opt to build a personalized profile to ensure privacy and ethical usage of our framework.</p>
      </sec>
      <sec>
        <title>Validating Model Interpretation</title>
        <p>The features that SHAP found to have an impact on modeling decisions are well supported by previous research. For example, MFCC features have already proven to be useful in a wide range of audio tasks such as speaker recognition [<xref ref-type="bibr" rid="ref48">48</xref>], music information retrieval [<xref ref-type="bibr" rid="ref38">38</xref>], voice activity detection [<xref ref-type="bibr" rid="ref49">49</xref>], and most importantly, in voice quality assessment [<xref ref-type="bibr" rid="ref50">50</xref>]. Similarly, the high impact of the HNR and the measures of uncertainty in F0 estimation (RPDE) and inability to maintain a constant F0 (PPE) on the model’s output are in congruence with the findings from Little et al [<xref ref-type="bibr" rid="ref12">12</xref>]. However, explaining the first part of <xref rid="figure5" ref-type="fig">Figure 5</xref> in light of PD-induced vocal impairment is a difficult task. MFCC features are calculated by converting the audio signal into the frequency domain, and they denote how energy in the signal is distributed within various frequency ranges. Therefore, providing a physical interpretation of the SHAP values corresponding to the MFCC features is not straightforward. Similarly, Little et al [<xref ref-type="bibr" rid="ref12">12</xref>] designed the RPDE and PPE features to model a sustained phonation task (uttering “ahh”) with the assumption that healthy participants will be able to maintain a smooth and regular voice pattern. In contrast, uttering multiple sentences introduces considerable variation in the data, adding a wide set of heterogeneous patterns. Therefore, the underlying assumptions behind constructing these features do not hold for our task of uttering multiple sentences.</p>
        <p>We conduct an empirical validation of the SHAP output shown in the first part of <xref rid="figure5" ref-type="fig">Figure 5</xref>. We incrementally add one feature at a time to build a dynamic feature set, train successive models on that feature set, and report the accuracy and AUC performances. We see that the performance of our model saturates after adding 7 to 8 features. Therefore, we can say that the SHAP analysis teases out the most important features driving the model’s performance successfully.</p>
      </sec>
      <sec>
        <title>Why Not Stratified Analysis Only?</title>
        <p>We built models inclusive of all genders for several reasons. First, there are potential shared characteristics among vocal patterns of all genders that can be relevant for detecting PD. Second, dividing the data set into two portions reduces the available training data for each model, which may, in turn, reduce the generalization capability of each model. In addition, our model analyzes data from patients of all ages. Although most people diagnosed with PD are older than 60 years, approximately 10% to 20% of the population diagnosed with PD are younger than 50 years, and approximately half of them are younger than 40 years [<xref ref-type="bibr" rid="ref51">51</xref>]. As anecdotal evidence, Michael J Fox was diagnosed with PD at the age of 29 years [<xref ref-type="bibr" rid="ref52">52</xref>], and Muhammad Ali had PD by 42 years [<xref ref-type="bibr" rid="ref53">53</xref>]. In our data set, there were also a minority of patients with PD who were younger than 50 years (<xref rid="figure4" ref-type="fig">Figure 4</xref>). On the basis of these observations, we believe that our system should provide access to all people, irrespective of age. PD does not discriminate by age while affecting a person, and an automated system should not discriminate based on age and provide equitable services to people of all ages. However, these factors can function as confounders in PD analysis. Therefore, we provided additional analysis to ensure that our model does not use the idiosyncrasies of group-specific information to make predictions.</p>
      </sec>
      <sec>
        <title>Performance Excluding Laboratory Environment Data</title>
        <p>When the data were collected in the laboratory, participants had access to a clinician providing support using a consistent recording setup and dedicated bandwidth. In contrast, the data collected in the home setting involved no assistance and included the real-world variability of heterogeneous recording setups and inconsistent internet speed. In theory, the data collected at the <italic>laboratory</italic> and <italic>home</italic> were very different from each other.</p>
        <p>To ensure that our model works equally well without the <italic>clean lab data</italic>, we designed two experiments. In experiment 1, we removed clean lab data, which was approximately 7.4% (54/726) of the entire data set, retrained our model on the remaining 672 participants using the leave-one-out validation procedure, and calculated the performance metrics. In experiment 2, we randomly removed 7% (roughly 54 data points) of <italic>home</italic> data from the entire data set (while keeping the <italic>lab</italic> data intact), building a model with the remaining 93% data with the leave-one-out cross-validation method. Then, we conducted experiment 2 10 times and calculated the <italic>average</italic> performance from these 10 runs. We found that the AUC metric across these three experiments was fairly consistent, with a very small 0.015 decrease in AUC when removing lab data, demonstrating that our framework performs equally well across the <italic>lab</italic> and <italic>home</italic> data.</p>
      </sec>
      <sec>
        <title>Label Inconsistency and Predicting Tremor Score</title>
        <p>Using the PARK [<xref ref-type="bibr" rid="ref29">29</xref>] protocol, we collected one of the largest data sets of participants conducting a series of motor, facial expression, and speech tasks following the MDS-UPDRS PD assessment protocol [<xref ref-type="bibr" rid="ref3">3</xref>]. Although we analyzed only the speech task in this study, the data set can be potentially used to automate the assessment of a large set of MDS-UPDRS tasks and facilitate early-stage PD detection, thus improving the quality of life for millions of people worldwide. However, deploying the data collection protocol on the web and facilitating access to anyone anywhere around the world comes at a cost. To date, all of our participants with PD have been clinically verified to be diagnosed with PD. Therefore, the labels of the PD data points are reliable. However, the participants without PD did not undergo clinical verification. Our data collection protocol asked them appropriate questions to check whether they had been diagnosed with PD and collected data when they answered in the negative. However, we cannot discount the possibility that a small subset of our population without PD is in the very early stage of PD and is oblivious about it. At present, there are estimated to be around 1 million patients with PD in the United States, out of a population of 330 million [<xref ref-type="bibr" rid="ref51">51</xref>], yielding a PD prevalence rate of 0.3%. However, as our non-PD data set was largely tilted toward people older than 50 years, the rate in our data set could be higher than 0.3%. Even if we consider a liberal 1% prevalence rate, the number of individuals with undiagnosed PD in our control population is likely low (at most 4.6 persons). Therefore, we believe that the non-PD data labels are generally reliable. In the future, we plan to model tremor score in (0-4 range for each task; 0 for no tremor, and 4 for severe tremor) instead of a binary label following the MDS-UPDRS protocol to address this problem more thoroughly.</p>
      </sec>
      <sec>
        <title>Building a More Representative Data Set</title>
        <p>The PARK protocol is web enabled, allowing anyone with access to the internet to contribute data. We plan to augment our data set by adding more non–native English speakers, females, and participants with PD. As our PD data are collected through contacts from local PD clinics and non-PD data through Amazon Mechanical Turk, most of our participants were from the United States or other English-speaking countries. To make our model more robust on data from non–native English speakers, we are in process of collecting both PD and non-PD data from non–native English-speaking countries. In addition, our current protocol can collect data from people with computer and internet access only, and therefore, it can potentially exclude underserved people. In the future, we plan to build desktop and mobile apps that can collect data offline to build a more inclusive framework.</p>
        <p>Our best model for female data performed worse than its male counterparts, as shown in <xref ref-type="table" rid="table4">Table 4</xref>. We attribute this degraded performance PD or non-PD imbalance for female participants in our data set: the PD-to-non-PD ratio for females was 101 out of 300 (<xref ref-type="table" rid="table1">Table 1</xref>). Previous epidemiological studies have shown that both the incidence and prevalence of PD are 1.5 to 2 times higher in men than in women [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. Therefore, any randomly sampled data set for PD will have a higher prevalence of males, contributing to models that are more biased toward males. Our immediate plan is to prioritize collecting balanced data from all genders, ages, and races across geographical boundaries, leading to a balanced data set.</p>
        <p>Our data set also has the ubiquitous problem of data imbalance in diagnostic tests: the amount of data from participants without PD is 1.8 times more than their PD counterparts. Therefore, there is a risk that the model will be biased toward predicting the majority non-PD class as default and yield a high false-negative score. To address this, we plan to recruit more participants with PD in the future to make our data set more balanced. Another potential approach is to run the analysis on a subset of the data set produced by conducting proper age, gender, and matching of patients with and without PD.</p>
        <p>As shown in <xref ref-type="table" rid="table1">Table 1</xref>, our participants with PD were diagnosed 7<italic>.</italic>88 (SD 5<italic>.</italic>41) years ago. Owing to limited data availability, we did not conduct an analysis on early-stage PD prediction. In the future, we plan to include more participants in the early stages of PD and build models that can detect them. We will especially focus on recruiting participants with PD in the age range of 20 to 40 years to analyze the very early-stage onset of PD among young adults. Furthermore, we plan to collect and analyze multiple speech instances from each person to reduce person-specific variability and obtain a more holistic view of their PD state.</p>
      </sec>
      <sec>
        <title>Increasing Model Performance</title>
        <p>Although we consider AUC to be a better metric for our data set, our model performs 10% better than always choosing non-PD as the prediction in terms of binary accuracy. To be practically deployable in clinical settings, the performance needs to be improved further. We will focus on four promising avenues: making the data set balanced, designing better features capable of modeling the nuanced pattern in our data, making our model resilient to noise present in our data, and deconfounding the PD prediction from age and gender variables.</p>
        <p>To remove noise, we plan to augment the techniques proposed in Poorjam et al [<xref ref-type="bibr" rid="ref56">56</xref>] to automatically enhance our data quality by detecting the segments of data that conform to our experimental design. Moreover, as discussed above, gender and age can appear as confounding variables in the PD prediction task. In this paper, we have shown that our unified model and stratified sex-specific models have similar performance. However, we plan to build better models to systematically deconfound the effects of both age and gender variables while benefiting from them simultaneously. We can achieve this by incorporating the causal bootstrapping technique—a resampling method that considers the causal relationship between variables and negates the effect of spurious, indirect interactions, as outlined by Little and Badawy [<xref ref-type="bibr" rid="ref57">57</xref>].</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Description of the features.</p>
        <media xlink:href="jmir_v23i10e26305_app1.docx" xlink:title="DOCX File , 20 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HNR</term>
          <def>
            <p>harmonic-to-noise ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MDS-UPDRS</term>
          <def>
            <p>Movement Disorder Society-Unified Parkinson’s Disease Rating Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MFCC</term>
          <def>
            <p>mel-frequency cepstral coefficient</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">P2FA</term>
          <def>
            <p>Penn Phonetics Lab Forced Aligner Toolkit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PARK</term>
          <def>
            <p>Parkinson’s Analysis with Remote Kinetic-tasks</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PASE</term>
          <def>
            <p>problem agnostic speech encoder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">PD</term>
          <def>
            <p>Parkinson disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">PPE</term>
          <def>
            <p>pitch period entropy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ROC</term>
          <def>
            <p>receiver operating characteristics</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">RPDE</term>
          <def>
            <p>recurrence period density entropy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was funded by the National Institute of Neurological Disorders and Stroke of the National Institutes of Health under award number P50NS108676.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>WR, SL, MSI, and VNA worked in data analysis, feature extraction, model training, model interpretation, and manuscript preparation. HR, AAM, EW, and SJR helped build, maintain, and coordinate the data collection procedure. MRA, MAL, and RD helped improve the manuscript; suggested important experiments; and provided access to critical resources such as code and data. All the other authors helped in data collection. EH was the principal investigator of the project; he facilitated the entire project and helped shape the narrative of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khadilkar</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Neurology in India</article-title>
          <source>Ann Indian Acad Neurol</source>
          <year>2013</year>
          <month>10</month>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>465</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.annalsofian.org/article.asp?issn=0972-2327;year=2013;volume=16;issue=4;spage=465;epage=466;aulast=Khadilkar"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/0972-2327.120415</pub-id>
          <pub-id pub-id-type="medline">24339561</pub-id>
          <pub-id pub-id-type="pii">AIAN-16-465</pub-id>
          <pub-id pub-id-type="pmcid">PMC3841582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Howlett</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>Neurology in Africa</article-title>
          <source>Neurology</source>
          <year>2014</year>
          <month>08</month>
          <day>11</day>
          <volume>83</volume>
          <issue>7</issue>
          <fpage>654</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1212/wnl.0000000000000682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goetz</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Tilley</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Shaftman</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Stebbins</surname>
              <given-names>GT</given-names>
            </name>
            <name name-style="western">
              <surname>Fahn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez-Martin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Poewe</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sampaio</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Stern</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Dodel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubois</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Holloway</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jankovic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kulisevsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Lees</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leurgans</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>LeWitt</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Nyenhuis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Olanow</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Rascol</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Schrag</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Teresi</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>van Hilten</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>LaPelle</surname>
              <given-names>N</given-names>
            </name>
            <collab>Movement Disorder Society UPDRS Revision Task Force</collab>
          </person-group>
          <article-title>Movement Disorder Society-sponsored revision of the Unified Parkinson's Disease Rating Scale (MDS-UPDRS): scale presentation and clinimetric testing results</article-title>
          <source>Mov Disord</source>
          <year>2008</year>
          <month>11</month>
          <day>15</day>
          <volume>23</volume>
          <issue>15</issue>
          <fpage>2129</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1002/mds.22340</pub-id>
          <pub-id pub-id-type="medline">19025984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dorsey</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>McDuff</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Spatio-temporal attention and magnification for classification of Parkinson’s disease from videos collected via the internet</article-title>
          <source>Proceedings of the 15th IEEE International Conference on Automatic Face and Gesture Recognition (FG 2020)</source>
          <year>2020</year>
          <conf-name>15th IEEE International Conference on Automatic Face and Gesture Recognition (FG 2020)</conf-name>
          <conf-date>November 16-20, 2020</conf-date>
          <conf-loc>Buenos Aires, Argentina</conf-loc>
          <pub-id pub-id-type="doi">10.1109/fg47880.2020.00008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lonini</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shawen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Simuni</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Poon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shimanovich</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Daeschler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghaffari</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Jayaraman</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Wearable sensors for Parkinson's disease: which data are worth collecting for training symptom detection models</article-title>
          <source>NPJ Digit Med</source>
          <year>2018</year>
          <month>11</month>
          <day>23</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>64</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-018-0071-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-018-0071-z</pub-id>
          <pub-id pub-id-type="medline">31304341</pub-id>
          <pub-id pub-id-type="pii">71</pub-id>
          <pub-id pub-id-type="pmcid">PMC6550186</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bandini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giovannelli</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Orlandi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Barbagallo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cincotta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vanni</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chiaramonti</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Borgheresi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zaccara</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Manfredi</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automatic identification of dysprosody in idiopathic Parkinson's disease</article-title>
          <source>Biomed Signal Process Control</source>
          <year>2015</year>
          <month>03</month>
          <volume>17</volume>
          <fpage>47</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bspc.2014.07.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Iansek</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Marigliani</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bradshaw</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Gates</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Speech impairment in a large sample of patients with Parkinson’s disease</article-title>
          <source>Behav Neurol</source>
          <year>1999</year>
          <volume>11</volume>
          <issue>3</issue>
          <fpage>131</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1155/1999/327643</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Logemann</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>HB</given-names>
            </name>
            <name name-style="western">
              <surname>Boshes</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Blonsky</surname>
              <given-names>ER</given-names>
            </name>
          </person-group>
          <article-title>Frequency and cooccurrence of vocal tract dysfunctions in the speech of a large sample of Parkinson patients</article-title>
          <source>J Speech Hear Disord</source>
          <year>1978</year>
          <month>02</month>
          <volume>43</volume>
          <issue>1</issue>
          <fpage>47</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1044/jshd.4301.47</pub-id>
          <pub-id pub-id-type="medline">633872</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Duffy</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Motor Speech Disorders E-Book: Substrates, Differential Diagnosis, and Management. 4th Edition</source>
          <year>2019</year>
          <publisher-loc>Amsterdam</publisher-loc>
          <publisher-name>Elsevier</publisher-name>
          <fpage>201</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arora</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Venkataraman</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Donohue</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Biglan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dorsey</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Detecting and monitoring the symptoms of Parkinson's disease using smartphones: A pilot study</article-title>
          <source>Parkinsonism Relat Disord</source>
          <year>2015</year>
          <month>06</month>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>650</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1016/j.parkreldis.2015.02.026</pub-id>
          <pub-id pub-id-type="medline">25819808</pub-id>
          <pub-id pub-id-type="pii">S1353-8020(15)00081-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Playfer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hindle</surname>
              <given-names>JV</given-names>
            </name>
          </person-group>
          <source>Parkinson's Disease in the Older Patient</source>
          <year>2008</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>CRC Press</publisher-name>
          <fpage>1</fpage>
          <lpage>432</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Spielman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Suitability of dysphonia measurements for telemonitoring of Parkinson’s disease</article-title>
          <source>Nat Prec</source>
          <year>2008</year>
          <month>09</month>
          <day>12</day>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.1038/npre.2008.2298.1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Accurate telemonitoring of Parkinson’s disease symptom severity using nonlinear speech signal processing and statistical machine learning</article-title>
          <source>Doctoral Dissertation, Oxford University, UK</source>
          <year>2012</year>
          <access-date>2021-09-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ora.ox.ac.uk/objects/uuid:2a43b92a-9cd5-4646-8f0f-81dbe2ba9d74">https://ora.ox.ac.uk/objects/uuid:2a43b92a-9cd5-4646-8f0f-81dbe2ba9d74</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Delen</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Computer-aided diagnosis of parkinson's disease using complex-valued neural networks and mrmr feature selection algorithm</article-title>
          <source>J Healthc Eng</source>
          <year>2015</year>
          <month>08</month>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>281</fpage>
          <lpage>302</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1260/2040-2295.6.3.281"/>
          </comment>
          <pub-id pub-id-type="doi">10.1260/2040-2295.6.3.281</pub-id>
          <pub-id pub-id-type="medline">26753436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rueda</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Feature analysis of dysphonia speech for monitoring Parkinson’s disease</article-title>
          <source>Proceedings of the 39th Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)</source>
          <year>2017</year>
          <conf-name>39th Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)</conf-name>
          <conf-date>July 11-15, 2017</conf-date>
          <conf-loc>Jeju, Korea (South)</conf-loc>
          <fpage>2308</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1109/embc.2017.8037317</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wroge</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Özkanca</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Demiroglu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Si</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Atkins</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ghomi</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Parkinson’s disease diagnosis using machine learning and voice</article-title>
          <source>Proceedings of the IEEE Signal Processing in Medicine and Biology Symposium (SPMB)</source>
          <year>2018</year>
          <conf-name>IEEE Signal Processing in Medicine and Biology Symposium (SPMB)</conf-name>
          <conf-date>Dec. 1, 2018</conf-date>
          <conf-loc>Philadelphia, PA, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/spmb.2018.8615607</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaiciukynas</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gelzinis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Verikas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bacauskiene</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Parkinson’s disease detection from speech using convolutional neural networks</article-title>
          <source>Proceedings of the International Conference on Smart Objects and Technologies for Social Good</source>
          <year>2017</year>
          <conf-name>International Conference on Smart Objects and Technologies for Social Good</conf-name>
          <conf-date>November 29-30, 2017</conf-date>
          <conf-loc>Pisa, Italy</conf-loc>
          <fpage>206</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-76111-4_21</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vásquez-Correa</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Orozco-Arroyave</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bocklet</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nöth</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Towards an automatic evaluation of the dysarthria level of patients with Parkinson's disease</article-title>
          <source>J Commun Disord</source>
          <year>2018</year>
          <month>11</month>
          <volume>76</volume>
          <fpage>21</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jcomdis.2018.08.002</pub-id>
          <pub-id pub-id-type="medline">30149241</pub-id>
          <pub-id pub-id-type="pii">S0021-9924(17)30076-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dubey</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Abtahi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mahler</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mankodiya</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>EchoWear: smartwatch technology for voice and speech treatments of patients with Parkinson’s disease</article-title>
          <source>Proceedings of the Conference on Wireless Health</source>
          <year>2015</year>
          <conf-name>WH '15: Wireless Health 2015 Conference</conf-name>
          <conf-date>October 14 - 16, 2015</conf-date>
          <conf-loc>Bethesda Maryland</conf-loc>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1145/2811780.2811957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vásquez-Correa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Arias-Vergara</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Orozco-Arroyave</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vargas-Bonilla</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Arias-Londoño</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nöth</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Automatic detection of Parkinson’s disease from continuous speech recorded in non-controlled noise conditions</article-title>
          <source>Proceedings of the Sixth Annual Conferecence on International Speech Communication Association</source>
          <year>2015</year>
          <conf-name>Sixth Annual Conferecence on International Speech Communication Association</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Dresden, Germany</conf-loc>
          <pub-id pub-id-type="doi">10.21437/interspeech.2016-1122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An efficient hybrid kernel extreme learning machine approach for early diagnosis of Parkinson׳s disease</article-title>
          <source>Neurocomputing</source>
          <year>2016</year>
          <month>04</month>
          <volume>184</volume>
          <fpage>131</fpage>
          <lpage>44</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2015.07.138</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <source>Park Test</source>
          <access-date>2020-09-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://parktest.net/">https://parktest.net/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kubota</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for large-scale wearable sensor data in Parkinson's disease: Concepts, promises, pitfalls, and futures</article-title>
          <source>Mov Disord</source>
          <year>2016</year>
          <month>09</month>
          <volume>31</volume>
          <issue>9</issue>
          <fpage>1314</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1002/mds.26693</pub-id>
          <pub-id pub-id-type="medline">27501026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rahul</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Katabi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>BodyCompass:Monitoring Sleep Posture with Wireless Signals</article-title>
          <source>Proceedings of the ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies</source>
          <year>2020</year>
          <month>06</month>
          <day>15</day>
          <conf-name>ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies</conf-name>
          <conf-date>June 15, 2020</conf-date>
          <conf-loc>New York, USA</conf-loc>
          <fpage>1</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1145/3397311</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Accurate telemonitoring of Parkinson's disease progression by noninvasive speech tests</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2010</year>
          <month>04</month>
          <volume>57</volume>
          <issue>4</issue>
          <fpage>884</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1109/tbme.2009.2036000</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <article-title>Mobile fact sheet</article-title>
          <source>Pew Research Center,  Internet &#38; Technology</source>
          <year>2019</year>
          <access-date>2021-09-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewresearch.org/internet/fact-sheet/mobile/">https://www.pewresearch.org/internet/fact-sheet/mobile/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pascual</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ravanelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Serrà</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bonafonte</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Learning problem-agnostic speech representations from multiple self-supervised tasks</article-title>
          <source>Proceedings of the Annual Conference on Internatioal Speech Communication Association - INTERSPEECH International</source>
          <year>2019</year>
          <conf-name>Annual Conference on Internatioal Speech Communication Association - INTERSPEECH International</conf-name>
          <conf-date>Apr 6, 2019</conf-date>
          <conf-loc>Graz, Austria</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1904.03416"/>
          </comment>
          <pub-id pub-id-type="doi">10.21437/interspeech.2019-2605</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Using the cellular mobile telephone network to remotely monitor Parkinson's disease symptom severity</article-title>
          <source>Semantic Scholar</source>
          <access-date>2021-09-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/Using-the-cellular-mobile-telephone-network-to-%E2%80%9F-s-Tsanas-Little/17180d351b33f13f7fe681ddf8411cf6aad74b64">https://www.semanticscholar.org/paper/Using-the-cellular-mobile-telephone-network-to-%E2%80%9F-s-Tsanas-Little/17180d351b33f13f7fe681ddf8411cf6aad74b64</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Langevin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dorsey</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>The PARK Framework for automated analysis of Parkinson's disease characteristics</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2019</year>
          <month>06</month>
          <day>21</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.1145/3328925</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <article-title>Penn Phonetics Lab Forced Aligner Toolkit (P2FA) for Python3</article-title>
          <source>GitHub</source>
          <access-date>2021-09-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/jaekookang/p2fa_py3">https://github.com/jaekookang/p2fa_py3</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <source>HTK Speech Recognition Toolkit</source>
          <access-date>2021-09-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://htk.eng.cam.ac.uk/">http://htk.eng.cam.ac.uk/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liberman</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Speaker identification on the SCOTUS corpus</article-title>
          <source>J Acoust Soc Am</source>
          <year>2008</year>
          <month>05</month>
          <volume>123</volume>
          <issue>5</issue>
          <fpage>3878</fpage>
          <pub-id pub-id-type="doi">10.1121/1.2935783</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moltu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Stefansen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Svisdahl</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Veseth</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Negotiating the coresearcher mandate - service users' experiences of doing collaborative research on mental health</article-title>
          <source>Disabil Rehabil</source>
          <year>2012</year>
          <volume>34</volume>
          <issue>19</issue>
          <fpage>1608</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.3109/09638288.2012.656792</pub-id>
          <pub-id pub-id-type="medline">22489612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jadoul</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>de Boer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Introducing Parselmouth: A Python interface to Praat</article-title>
          <source>J Phonetics</source>
          <year>2018</year>
          <month>11</month>
          <volume>71</volume>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.wocn.2018.07.001"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.wocn.2018.07.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <article-title>Robust parsimonious selection of dysphonia measures for telemonitoring of Parkinson's disease symptom severity</article-title>
          <source>Semantic Scholar</source>
          <access-date>2019-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/Robust-parsimonious-selection-of-dysphonia-measures-Tsanas-Little/43b91147f0b5ab900b29ea7943d58fe761f0e26b">https://www.semanticscholar.org/paper/Robust-parsimonious-selection-of-dysphonia-measures-Tsanas-Little/43b91147f0b5ab900b29ea7943d58fe761f0e26b</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Costello</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Moroz</surname>
              <given-names>IM</given-names>
            </name>
          </person-group>
          <article-title>Exploiting nonlinear recurrence and fractal scaling properties for voice disorder detection</article-title>
          <source>BioMed Eng OnLine</source>
          <year>2007</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>23</fpage>
          <pub-id pub-id-type="doi">10.1186/1475-925x-6-23</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goldberger</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>A Course in Econometrics</source>
          <year>1991</year>
          <publisher-loc>Cambridge, MA</publisher-loc>
          <publisher-name>Harvard University Press</publisher-name>
          <fpage>1</fpage>
          <lpage>426</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Information Retrieval for Music and Motion</source>
          <year>2007</year>
          <publisher-loc>Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Spielman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>LO</given-names>
            </name>
          </person-group>
          <article-title>Novel speech signal processing algorithms for high-accuracy classification of Parkinson's disease</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2012</year>
          <month>05</month>
          <volume>59</volume>
          <issue>5</issue>
          <fpage>1264</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1109/tbme.2012.2183367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cortes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vapnik</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Support-vector networks</article-title>
          <source>Mach Learn</source>
          <year>1995</year>
          <month>9</month>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>273</fpage>
          <lpage>97</lpage>
          <pub-id pub-id-type="doi">10.1007/bf00994018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Xgboost: A scalable tree boosting system</article-title>
          <source>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2016</year>
          <conf-name>KDD '16: The 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 13 - 17, 2016</conf-date>
          <conf-loc>San Francisco California</conf-loc>
          <fpage>785</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>TY</given-names>
            </name>
          </person-group>
          <article-title>Lightgbm: A highly efficient gradient boosting decision tree</article-title>
          <source>Adv Neural Inf Process Syst</source>
          <year>2017</year>
          <fpage>3154</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/LightGBM%3A-A-Highly-Efficient-Gradient-Boosting-Tree-Ke-Meng/497e4b08279d69513e4d2313a7fd9a55dfb73273"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Random decision forests</article-title>
          <source>Proceedings of 3rd International Conference on Document Analysis and Recognition</source>
          <year>1995</year>
          <conf-name>3rd International Conference on Document Analysis and Recognition</conf-name>
          <conf-date>Aug. 14-16, 1995</conf-date>
          <conf-loc>Montreal, QC, Canada</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icdar.1995.598994</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: Synthetic minority over-sampling technique</article-title>
          <source>J Artif Intell Res</source>
          <year>2002</year>
          <month>06</month>
          <day>01</day>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Kamei</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Borderline over-sampling for imbalanced data classification</article-title>
          <source>Int J Knowl Eng Soft Data Paradig Inderscience Publishers</source>
          <year>2011</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>4</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1504/ijkesdp.2011.039875</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shapley</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A value for n-person games</article-title>
          <source>Contrib Theory Games</source>
          <year>1953</year>
          <volume>2</volume>
          <issue>28</issue>
          <fpage>307</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1017/cbo9780511528446.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Erion</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>DeGrave</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Prutkin</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Nair</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Himmelfarb</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bansal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>From local explanations to global understanding with explainable AI for trees</article-title>
          <source>Nat Mach Intell</source>
          <year>2020</year>
          <month>01</month>
          <day>17</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>56</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32607472"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s42256-019-0138-9</pub-id>
          <pub-id pub-id-type="medline">32607472</pub-id>
          <pub-id pub-id-type="pmcid">PMC7326367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhattarai</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Alsadoon</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Elchouemi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Experiments on the MFCC application in speaker recognition using Matlab</article-title>
          <source>Seventh International Conference on Information Science and Technology (ICIST)</source>
          <year>2017</year>
          <conf-name>Seventh International Conference on Information Science and Technology (ICIST)</conf-name>
          <conf-date>April 16-19, 2017</conf-date>
          <conf-loc>Da Nang, Vietnam</conf-loc>
          <fpage>32</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1109/icist.2017.7926796</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kinnunen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chernenko</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tuononen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fränti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Voice activity detection using MFCC features and support vector machine</article-title>
          <source>Proceedings of the International Conference Speech and Computer (SPECOM07)</source>
          <year>2007</year>
          <conf-name>International Conference Speech and Computer (SPECOM07)</conf-name>
          <conf-date>2007</conf-date>
          <conf-loc>Moscow, Russia</conf-loc>
          <fpage>556</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cs.uef.fi/sipu/pub/svm-vad-SPECOM07.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsanas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>McSharry</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Ramig</surname>
              <given-names>LO</given-names>
            </name>
          </person-group>
          <article-title>Nonlinear speech analysis algorithms mapped to a standard metric achieve clinically useful quantification of average Parkinson's disease symptom severity</article-title>
          <source>J R Soc Interface</source>
          <year>2011</year>
          <month>06</month>
          <day>06</day>
          <volume>8</volume>
          <issue>59</issue>
          <fpage>842</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21084338"/>
          </comment>
          <pub-id pub-id-type="doi">10.1098/rsif.2010.0456</pub-id>
          <pub-id pub-id-type="medline">21084338</pub-id>
          <pub-id pub-id-type="pii">rsif.2010.0456</pub-id>
          <pub-id pub-id-type="pmcid">PMC3104343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kinnunen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chernenko</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tuononen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fränti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Voice activity detection using MFCC features and support vector machine</article-title>
          <source>Proceedings of the International Conference Speech and Computer (SPECOM07)</source>
          <year>2007</year>
          <conf-name>International Conference Speech and Computer (SPECOM07)</conf-name>
          <conf-date>2007</conf-date>
          <conf-loc>Moscow, Russia</conf-loc>
          <fpage>556</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cs.uef.fi/sipu/pub/svm-vad-SPECOM07.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <article-title>Michael's Story</article-title>
          <source>Michael J Fox</source>
          <access-date>2021-09-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.michaeljfox.org/michaels-story">https://www.michaeljfox.org/michaels-story</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McCallum</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Muhammad Ali’s advocacy for Parkinson’s disease endures with boxing legacy</article-title>
          <source>Parkinson’s News Today</source>
          <year>2016</year>
          <access-date>2021-09-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://parkinsonsnewstoday.com/2016/06/10/muhammad-alis-advocacy-parkinsons-disease-endures-boxing-legacy/">https://parkinsonsnewstoday.com/2016/06/10/muhammad-alis-advocacy-parkinsons-disease-endures-boxing-legacy/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Den Eeden</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Tanner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fross</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Leimpeter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bloch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Incidence of Parkinson's disease: variation by age, gender, and race/ethnicity</article-title>
          <source>Am J Epidemiol</source>
          <year>2003</year>
          <month>06</month>
          <day>01</day>
          <volume>157</volume>
          <issue>11</issue>
          <fpage>1015</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.1093/aje/kwg068</pub-id>
          <pub-id pub-id-type="medline">12777365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haaxma</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Bloem</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Borm</surname>
              <given-names>GF</given-names>
            </name>
            <name name-style="western">
              <surname>Oyen</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Leenders</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Eshuis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Booij</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dluzen</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Horstink</surname>
              <given-names>MW</given-names>
            </name>
          </person-group>
          <article-title>Gender differences in Parkinson's disease</article-title>
          <source>J Neurol Neurosurg Psychiatry</source>
          <year>2007</year>
          <month>08</month>
          <day>01</day>
          <volume>78</volume>
          <issue>8</issue>
          <fpage>819</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17098842"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jnnp.2006.103788</pub-id>
          <pub-id pub-id-type="medline">17098842</pub-id>
          <pub-id pub-id-type="pii">jnnp.2006.103788</pub-id>
          <pub-id pub-id-type="pmcid">PMC2117736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poorjam</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Kavalekalam</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Raykov</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Little</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Christensen</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>Automatic quality control and enhancement for voice-based remote Parkinson’s disease detection</article-title>
          <source>Speech Commun</source>
          <year>2021</year>
          <month>03</month>
          <volume>127</volume>
          <fpage>1</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1016/j.specom.2020.12.007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Little</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Badawy</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Causal bootstrapping</article-title>
          <source>arXiv</source>
          <year>2019</year>
          <access-date>2021-09-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1910.09648">https://arxiv.org/abs/1910.09648</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
