<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Biomed Eng</journal-id><journal-id journal-id-type="publisher-id">biomedeng</journal-id><journal-id journal-id-type="index">24</journal-id><journal-title>JMIR Biomedical Engineering</journal-title><abbrev-journal-title>JMIR Biomed Eng</abbrev-journal-title><issn pub-type="epub">2561-3278</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v10i1e64357</article-id><article-id pub-id-type="doi">10.2196/64357</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Optimizing Voice Sample Quantity and Recording Settings for the Prediction of Type 2 Diabetes Mellitus: Retrospective Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Assadi</surname><given-names>Atousa</given-names></name><degrees>MSc, MEng</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Oreskovic</surname><given-names>Jessica</given-names></name><degrees>MAS</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kaufman</surname><given-names>Jaycee</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Fossat</surname><given-names>Yan</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff id="aff1"><institution>Klick Applied Sciences</institution><addr-line>175 Bloor St East, North Tower, 3rd floor</addr-line><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Rizvi</surname><given-names>Syed</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Leung</surname><given-names>Tiffany</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Martin</surname><given-names>Vincent</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Wang</surname><given-names>Zhepei</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Yan Fossat, MSc, Klick Applied Sciences, 175 Bloor St East, North Tower, 3rd floor, Toronto, ON, M4W3R8, Canada, 1 6472068717; <email>yfossat@klick.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>26</day><month>6</month><year>2025</year></pub-date><volume>10</volume><elocation-id>e64357</elocation-id><history><date date-type="received"><day>15</day><month>07</month><year>2024</year></date><date date-type="rev-recd"><day>03</day><month>06</month><year>2025</year></date><date date-type="accepted"><day>04</day><month>06</month><year>2025</year></date></history><copyright-statement>&#x00A9; Atousa Assadi, Jessica Oreskovic, Jaycee Kaufman, Yan Fossat. Originally published in JMIR Biomedical Engineering (<ext-link ext-link-type="uri" xlink:href="http://biomsedeng.jmir.org">http://biomsedeng.jmir.org</ext-link>), 26.6.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Biomedical Engineering, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://biomedeng.jmir.org/">https://biomedeng.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://biomedeng.jmir.org/2025/1/e64357"/><abstract><sec><title>Background</title><p>The use of acoustic biomarkers derived from speech signals is a promising non-invasive technique for diagnosing type 2 diabetes mellitus (T2DM). Despite its potential, there remains a critical gap in knowledge regarding the optimal number of voice recordings and recording schedule necessary to achieve effective diagnostic accuracy.</p></sec><sec><title>Objective</title><p>This study aimed to determine the optimal number of voice samples and the ideal recording schedule (frequency and timing), required to maintain the T2DM diagnostic efficacy while reducing patient burden.</p></sec><sec sec-type="methods"><title>Methods</title><p>We analyzed voice recordings from 78 adults (22 women), including 39 individuals diagnosed with T2DM. Participants had a mean (SD) age of 45.26 (10.63) years and mean (SD) BMI of 28.07 (4.59) kg/m&#x00B2;. In total, 5035 voice recordings were collected, with a mean (SD) of 4.91 (1.45) recordings per day; higher adherence was observed among women (5.13 [1.38] vs 4.82 [1.46] in men). We evaluated the diagnostic accuracy of a previously developed voice-based model under different recording conditions. Segmented linear regression analysis was used to assess model accuracy across varying numbers of voice recordings, and the Kendall tau correlation was used to measure the relationship between recording settings and accuracy. A significance threshold of <italic>P</italic>&#x003C;.05 was applied.</p></sec><sec sec-type="results"><title>Results</title><p>Our results showed that including up to 6 voice recordings notably improved the model accuracy for T2DM compared to using only one recording, with accuracy increasing from 59.61 to 65.02 for men and from 65.55 to 69.43 for women. Additionally, the day on which voice recordings were collected did not significantly affect model accuracy (<italic>P</italic>&#x003E;.05). However, adhering to recording within a single day demonstrated higher accuracy, with accuracy of 73.95% for women and 85.48% for men when all recordings were from the first and second days.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study underscores the optimal voice recording settings to reduce patient burden while maintaining diagnostic efficacy.</p></sec></abstract><kwd-group><kwd>vocal biomarker</kwd><kwd>acoustic biomarker</kwd><kwd>voice analysis</kwd><kwd>type 2 diabetes</kwd><kwd>diagnostics</kwd><kwd>digital phenotyping</kwd><kwd>voice data</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Diabetes mellitus is a chronic metabolic disorder characterized by persistent elevated blood glucose levels due to inadequate or impaired insulin production or utilization. It affects 10.5% of the worldwide population (536.6 million people) [<xref ref-type="bibr" rid="ref1">1</xref>], with type 2 diabetes mellitus (T2DM) accounting for 90% of cases [<xref ref-type="bibr" rid="ref2">2</xref>]. Uncontrolled diabetes is a major contributors to cardiovascular disorders, blindness, renal failure, and lower limb amputation [<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>Traditional diagnostic methods of fasting plasma glucose and oral glucose tolerance tests involve blood sampling, which can cause inconvenience or discomfort to patients owing to frequent monitoring. Moreover, the lack of a glucometer and the time spent for self-testing are barriers in the self-management of diabetes [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. In response to these challenges, acoustic biomarkers from speech signals have emerged as promising non-invasive alternatives, offering a convenient solution for diagnosing and monitoring diabetes, especially for individuals in remote areas with restricted health care accessibility.</p><p>Sustained periods of high blood glucose and the detrimental effects of peripheral neuropathy and myopathy in individuals with T2DM impact the elastic properties of the vocal folds [<xref ref-type="bibr" rid="ref5">5</xref>], weaken the laryngeal muscles, and induce respiratory changes [<xref ref-type="bibr" rid="ref6">6</xref>]. These physiological changes can affect voice parameters, leading to voice disorders like hoarseness [<xref ref-type="bibr" rid="ref7">7</xref>] and dysphagia [<xref ref-type="bibr" rid="ref8">8</xref>]. Consequently, compared to those without T2DM, individuals with the condition exhibit significant vocal differences, quantified by phonation time, fundamental frequency, jitters, and shimmers [<xref ref-type="bibr" rid="ref6">6</xref>], highlighting the importance of investigating vocal variations as potential markers of T2DM [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>Our group previously assessed the feasibility of using voice recordings from mobile applications to detect T2DM [<xref ref-type="bibr" rid="ref14">14</xref>]. Our results demonstrated that voice biomarkers&#x2014;specifically pitch, jitters, and shimmers&#x2014;combined with age and BMI could predict T2DM with an accuracy of 0.89 for women and 0.86 for men [<xref ref-type="bibr" rid="ref14">14</xref>]. However, requiring participants to record their voices at least 6 times daily over a 2-week period posed challenges related to participant burden and recording consistency.</p><p>Therefore, this study aims to optimize the voice sampling process by determining (1) the minimum number of voice samples required, and (2) the optimal recording schedule (frequency and timing) needed to maintain diagnostic accuracy while reducing participant burden. We hypothesize that a more streamlined voice sampling protocol can achieve comparable predictive performance to prior studies while improving feasibility for long-term diabetes monitoring.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>To address the objectives of this project, we designed a retrospective study based on our previously developed model and the same dataset that yielded the highest balanced accuracy [<xref ref-type="bibr" rid="ref14">14</xref>]. The original data collection took place between August 30, 2021, and June 30, 2022 in India [<xref ref-type="bibr" rid="ref14">14</xref>]. In total, 505 participants (mean [SD] age 41.03 [13.29] years, 336 male participants) were recruited and instructed to record a short English phrase (&#x201C;Hello. How are you? What is my glucose level right now?&#x201D;) up to 6 times daily using their smartphone for 14 consecutive days.</p></sec><sec id="s2-2"><title>Participants and Measurements</title><p>A balanced subset of the original dataset was used for this analysis and included 78 participants (aged &#x003E;18 years old, 22 women), with 39 diagnosed with T2DM [<xref ref-type="bibr" rid="ref14">14</xref>]. Participants in the T2DM and non-T2DM groups were matched for age and BMI to minimize the demographic impact on voice recordings (<xref ref-type="table" rid="table1">Table 1</xref>). A T2DM diagnosis was confirmed by a physician according to the American Diabetes Association guidelines [<xref ref-type="bibr" rid="ref15">15</xref>]. All participants were nonsmokers, had no diagnosed neurological or speech impairments, and signed the consent forms.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Patient demographic characteristics.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom">Total</td><td align="left" valign="bottom">Non-T2DM<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> group</td><td align="left" valign="bottom">T2DM group</td></tr></thead><tbody><tr><td align="left" valign="top">N (%)</td><td align="left" valign="top">78 (100.0)</td><td align="left" valign="top">39 (50.0)</td><td align="left" valign="top">39 (50.0)</td></tr><tr><td align="left" valign="top">&#x2003;Women</td><td align="left" valign="top">22 (28.21)</td><td align="left" valign="top">11 (50.0)</td><td align="left" valign="top">11 (50.0)</td></tr><tr><td align="left" valign="top">&#x2003;Men</td><td align="left" valign="top">56 (71.79)</td><td align="left" valign="top">28 (50.0)</td><td align="left" valign="top">28 (50.0)</td></tr><tr><td align="left" valign="top">Age (years), mean (SD)</td><td align="left" valign="top">45.26 (10.63)</td><td align="left" valign="top">45.49 (10.8)</td><td align="left" valign="top">45.03 (10.58)</td></tr><tr><td align="left" valign="top">&#x2003;Women</td><td align="left" valign="top">45.82 (10.4)</td><td align="left" valign="top">45.91 (10.85)</td><td align="left" valign="top">45.73 (10.47)</td></tr><tr><td align="left" valign="top">&#x2003;Men</td><td align="left" valign="top">45.04 (10.8)</td><td align="left" valign="top">45.32 (10.98)</td><td align="left" valign="top">44.75 (10.8)</td></tr><tr><td align="left" valign="top">BMI (kg/m<sup>2</sup>), mean (SD)</td><td align="left" valign="top">28.07 (4.59)</td><td align="left" valign="top">28.77 (5.01)</td><td align="left" valign="top">27.36 (4.06)</td></tr><tr><td align="left" valign="top">&#x2003;Women</td><td align="left" valign="top">30.25 (5.35)</td><td align="left" valign="top">31.41 (5.4)</td><td align="left" valign="top">29.09 (5.29)</td></tr><tr><td align="left" valign="top">&#x2003;Men</td><td align="left" valign="top">27.21 (3.98)</td><td align="left" valign="top">27.74 (4.53)</td><td align="left" valign="top">26.68 (3.34)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>T2DM: type 2 diabetes mellitus.</p></fn></table-wrap-foot></table-wrap><p>As part of the study protocol, participants recorded their voice at least 6 times per day over a 2-week period using a custom mobile application installed on their personal cell phones. These recordings took place either at home or in a quiet environment with minimal background noise [<xref ref-type="bibr" rid="ref12">12</xref>]. To establish a consistent starting point, a participant&#x2019;s first day (d01) was defined as the day they recorded at least 2 voice samples. Voice samples recorded prior to d01 were excluded from the analysis.</p></sec><sec id="s2-3"><title>Optimizing Voice Recording Quantity and Settings for Enhanced Model Accuracy</title><p>To analyze the collected voice recordings, 14 acoustic features were extracted to characterize key parameters related to pitch, intensity, harmonic noise ratio, shimmers, and jitters [<xref ref-type="bibr" rid="ref14">14</xref>]. Features that were significantly different between the T2DM and non-T2DM groups (<italic>P</italic>&#x003C;.05, Cohen <italic>d</italic> &#x003E;0.02) were included in he model development pipeline, with separate models for women and men. For women, the key features were pitch SD, mean pitch, RAP jitter, and apq3 shimmer, while for men, mean intensity, apq11 shimmer, intensity SD, and ppq5 jitter were used. A 5-fold cross-validation was performed for feature selection, threshold determination, and model optimization based on the best predictive balanced accuracy [<xref ref-type="bibr" rid="ref14">14</xref>]. The optimal model for women was a logistic regression model (threshold of 0.3) with BMI and 3 voice features: mean pitch, pitch SD, and RAP jitter. For men, the optimal model was a naive Bayes classifier (threshold of 0.215) with age, BMI, and 2 voice features: mean intensity and apq11 shimmer.</p><p>The analysis pipeline included (1) indicating the optimal number of voice recordings for effective T2DM classification based on changes in model accuracy across varying quantities of voice samples, and (2) studying the effect of voice recording configurations on predictive performance (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>To study the changes in the model&#x2019;s accuracy trend across varying number of voice samples, we employed segmented linear regression by fitting two distinct linear models to the data before and after the n voice samples breakpoint. The Kendall tau measure of correlation was used to investigate the strength and direction of the relationship between ordinal variables (such as days) and model accuracy. <italic>P</italic> values of .05 were considered statistically significant.</p></sec><sec id="s2-4"><title>Ethical Considerations</title><p>The protocol (ID MGCTS107) received ethics approval by Saanvi Ethical Research LLP (No. MGCTS/20/107 V01), all participants provided informed consent, and data were stored in a secure cloud database with no identifying information. Participants were compensated for their time; each participant received US $56.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Participants and Measurements</title><p>The mean (SD) age and mean (SD) BMI of participants were 45.26 (10.63) years and 28.07 (4.59) kg/m<sup>2</sup>, respectively (<xref ref-type="table" rid="table1">Table 1</xref>). In total, 5035 recordings were included in the analysis, and 2620 from participants with T2DM (<xref ref-type="table" rid="table2">Table 2</xref>). The mean (SD) number of daily recordings for all participants was 4.91 (1.45) with women more adherent to the protocol than men (5.13 [1.38] vs 4.82 [1.46], <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>, <xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Voice recording data.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom">Total</td><td align="left" valign="bottom">Non-T2DM<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> group</td><td align="left" valign="bottom">T2DM group</td></tr></thead><tbody><tr><td align="left" valign="top">N (%)</td><td align="left" valign="top">5035 (100)</td><td align="left" valign="top">2415 (48)</td><td align="left" valign="top">2620 (52)</td></tr><tr><td align="left" valign="top">&#x2003;Women, n (%)</td><td align="left" valign="top">1539 (30.6)</td><td align="left" valign="top">713 (46.3)</td><td align="left" valign="top">826 (53.7)</td></tr><tr><td align="left" valign="top">&#x2003;Men, n (%)</td><td align="left" valign="top">3496 (69.4)</td><td align="left" valign="top">1702 (48.7)</td><td align="left" valign="top">1794 (51.3)</td></tr><tr><td align="left" valign="top">Number of recordings per participant, mean (SD)</td><td align="left" valign="top">64.55 (19.53)</td><td align="left" valign="top">61.92 (21.67)</td><td align="left" valign="top">67.18 (17)</td></tr><tr><td align="left" valign="top">&#x2003;Women</td><td align="left" valign="top">69.95 (16.26)</td><td align="left" valign="top">64.82 (19.12)</td><td align="left" valign="top">75.09 (11.45)</td></tr><tr><td align="left" valign="top">&#x2003;Men</td><td align="left" valign="top">62.43 (20.42)</td><td align="left" valign="top">60.79 (22.82)</td><td align="left" valign="top">64.07 (17.97)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>T2DM: type 2 diabetes mellitus.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>The accuracy of the model using different number of voice recordings. The lines present the average accuracy for men (blue) and women (red). The shaded area shows the confidence interval. The numbers in the figure show the number of participants whose data were included in the analysis per day.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="biomedeng_v10i1e64357_fig01.png"/></fig></sec><sec id="s3-2"><title>Optimizing Voice Recording Quantity and Settings for Enhanced Model Accuracy</title><p>Both in men and women, the model accuracy improved with the inclusion of up to 6 voice samples, after which it stabilized with no significant improvement (<xref ref-type="fig" rid="figure1">Figure 1</xref>). The changes in the slope of the linear fit were &#x2212;1.15 for men and &#x2212;0.65 for women, indicating a faster accuracy improvement in men than in women with the addition of initial voice samples.</p><p>Considering 6 voice samples for effective T2DM diagnosis, the highest model accuracy was achieved with recordings from day 1 in men, while for women, the peak accuracy was observed with recordings from day 10 (<xref ref-type="fig" rid="figure2">Figure 2</xref>). However, the variations in model accuracy across different days were not significant, and no statistically discernible trend was observed (<italic>P</italic>=.23 for men, <italic>P</italic>=.27 for women). The model accuracy was generally higher for women than for men on most days, although the difference was not statistically significant, as indicated by the overlapping confidence intervals.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>The accuracy of the model using 6 voice recordings per day. d: day.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="biomedeng_v10i1e64357_fig02.png"/></fig><p>Moreover, we observed that the model accuracy was higher in men than in women when the majority of recordings were from the first day (<xref ref-type="fig" rid="figure3">Figure 3</xref>). As the distribution of recordings were balanced between the first and second days, the accuracy gap between men and women narrowed. Finally, when the majority of recordings were from the second day, the model accuracy was slightly higher for women than for men, with the differences in accuracy levels becoming less pronounced. Our statistical test indicated no significant trend in the model accuracy for men when using 6 recordings across 2 days (<italic>P</italic>&#x003E;.99). For women, there was a significant increasing trend in the model accuracy when the majority of recordings were taken on the second day (<italic>P</italic>=.03), suggesting that consistent participation in women can improve the model performance.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>The accuracy of the model using total 6 voice recordings from day 1 and day 2. D1: day 1, D2: day 2, N: number of samples from the day.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="biomedeng_v10i1e64357_fig03.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This research, to our knowledge, is the first to investigate the optimal balance between the number and settings of voice recordings for effective T2DM diagnosis, with the goal of reducing patient burden. Our findings indicated that 6 voice recordings are sufficient to maintain diagnostic accuracy, improving patient compliance and accessibility for T2DM screening. No significant differences in model accuracy were observed across different days while adherence to recording in a single day showed higher accuracy. This study lays the groundwork for future research and clinical applications focused on optimizing health care delivery for T2DM.</p></sec><sec id="s4-2"><title>Comparison to Prior Works</title><p>Previous studies have shown that an increased burden from the treatment and self-management of chronic health conditions such as T2DM is associated with higher levels of distress, lower adherence to self-care routines, decreased satisfaction with medications, reduced quality of life, poorer physical and mental health, and greater risk of complications and deaths [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. In alignment with these, our study demonstrated that up to 6 voice recordings are sufficient to effectively diagnose T2DM, thereby reducing patient burden while maintaining diagnostic accuracy.</p><p>There are conflicting reports on self-management among men and women. While Zhou et al [<xref ref-type="bibr" rid="ref19">19</xref>] observed that women exhibited greater compliance in self-care than men did, Mogre et al [<xref ref-type="bibr" rid="ref20">20</xref>] reported higher self-monitoring of blood glucose in men. In our study, despite the lower number of women participants than men, women showed a higher adherence to the voice recording protocol. This higher adherence among women may explain the observed increase in model accuracy, as recordings were distributed across 2 days, suggesting that consistent participation enhances the model performance.</p><p>Prior research has reported no significant day-to-day variability in voice recordings while there exists a significant time-of-day influence on acoustics with voice quality enhanced with increased voice use [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. In alignment with these findings, our results showed that both in men and in women, the model accuracy was not significantly different between days while there was an increase in accuracy when the majority of the recordings were from a single day. Due to the limited distribution of samples across different times of the day, we were unable to assess the time-of-day variability.</p></sec><sec id="s4-3"><title>Strengths and Limitations</title><p>This study provides important insights into optimizing voice-based T2DM diagnostics while minimizing participant burden. However, several limitations should be considered. First, there was a limited sample size of women. The smaller number of women participants may reduce the generalizability of our findings, particularly regarding sex-specific effects. Future studies with larger, more balanced datasets are needed to validate these observations. Second, our relatively small dataset limited the use of more advanced machine learning techniques, such as neural networks. While these models may offer further improvements in the diagnostic accuracy and insight into optimal data collection strategies, future studies with larger datasets are required to fully explore their potential. Third, due to uneven distribution of recordings across different times of the day, we could not assess how the time-of-day influences voice-based diagnostics. Future studies should implement controlled recording schedules to systematically examine these effects.</p></sec></sec></body><back><ack><p>This research was internally funded by Klick Inc.</p></ack><notes><sec><title>Data Availability</title><p>Data were commissioned by Klick Health, a private business, and are owned by Klick who does not allow sharing them.</p></sec></notes><fn-group><fn fn-type="con"><p>All authors contributed to preparing this manuscript. AA selected the analysis pipeline, performed data analysis, and prepared the manuscript. JO contributed to data analysis and revised and edited the manuscript. JK developed the voice classification model and provided feedback in methodology, data analysis, and reviewing the manuscript. YF supervised all aspects of the project, provided funding resources, and was involved in reviewing and submitting the manuscript.</p></fn><fn fn-type="conflict"><p>JO, JK, and YF are employees of Klick Inc.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">T2DM</term><def><p>type 2 diabetes mellitus</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>H</given-names> </name><name name-style="western"><surname>Saeedi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Karuranga</surname><given-names>S</given-names> </name><etal/></person-group><article-title>IDF diabetes atlas: Global, regional and country-level diabetes prevalence estimates for 2021 and projections for 2045</article-title><source>Diabetes Res Clin Pract</source><year>2022</year><month>01</month><volume>183</volume><fpage>109119</fpage><pub-id pub-id-type="doi">10.1016/j.diabres.2021.109119</pub-id><pub-id pub-id-type="medline">34879977</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Goyal</surname><given-names>R</given-names> </name><name name-style="western"><surname>Singhal</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jialal</surname><given-names>I</given-names> </name></person-group><source>Type 2 Diabetes</source><year>2024</year><access-date>2025-06-25</access-date><publisher-name>StatPearls</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK513253/">https://www.ncbi.nlm.nih.gov/books/NBK513253/</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mogre</surname><given-names>V</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Tzelepis</surname><given-names>F</given-names> </name><name name-style="western"><surname>Paul</surname><given-names>C</given-names> </name></person-group><article-title>Barriers to diabetic self-care: a qualitative study of patients&#x2019; and healthcare providers&#x2019; perspectives</article-title><source>J Clin Nurs</source><year>2019</year><month>06</month><volume>28</volume><issue>11-12</issue><fpage>2296</fpage><lpage>2308</lpage><pub-id pub-id-type="doi">10.1111/jocn.14835</pub-id><pub-id pub-id-type="medline">30791160</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gonzalez</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Tanenbaum</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Commissariat</surname><given-names>PV</given-names> </name></person-group><article-title>Psychosocial factors in medication adherence and diabetes self-management: Implications for research and practice</article-title><source>Am Psychol</source><year>2016</year><month>10</month><volume>71</volume><issue>7</issue><fpage>539</fpage><lpage>551</lpage><pub-id pub-id-type="doi">10.1037/a0040388</pub-id><pub-id pub-id-type="medline">27690483</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sidorova</surname><given-names>J</given-names> </name><name name-style="western"><surname>Carbonell</surname><given-names>P</given-names> </name><name name-style="western"><surname>&#x010C;uki&#x0107;</surname><given-names>M</given-names> </name></person-group><article-title>Blood glucose estimation from voice: first review of successes and challenges</article-title><source>J Voice</source><year>2022</year><month>09</month><volume>36</volume><issue>5</issue><fpage>737</fpage><pub-id pub-id-type="doi">10.1016/j.jvoice.2020.08.034</pub-id><pub-id pub-id-type="medline">33041176</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saghiri</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Vakhnovetsky</surname><given-names>A</given-names> </name><name name-style="western"><surname>Vakhnovetsky</surname><given-names>J</given-names> </name></person-group><article-title>Scoping review of the relationship between diabetes and voice quality</article-title><source>Diabetes Res Clin Pract</source><year>2022</year><month>03</month><volume>185</volume><fpage>109782</fpage><pub-id pub-id-type="doi">10.1016/j.diabres.2022.109782</pub-id><pub-id pub-id-type="medline">35176400</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hamdan</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Kurban</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Azar</surname><given-names>ST</given-names> </name></person-group><article-title>Prevalence of phonatory symptoms in patients with type 2 diabetes mellitus</article-title><source>Acta Diabetol</source><year>2013</year><month>10</month><volume>50</volume><issue>5</issue><fpage>731</fpage><lpage>736</lpage><pub-id pub-id-type="doi">10.1007/s00592-012-0392-3</pub-id><pub-id pub-id-type="medline">22527095</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weinreb</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Piersiala</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hillel</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Akst</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Best</surname><given-names>SR</given-names> </name></person-group><article-title>Dysphonia and dysphagia as early manifestations of autoimmune inflammatory myopathy</article-title><source>Am J Otolaryngol</source><year>2021</year><volume>42</volume><issue>1</issue><fpage>102747</fpage><pub-id pub-id-type="doi">10.1016/j.amjoto.2020.102747</pub-id><pub-id pub-id-type="medline">33038783</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pinyopodjanard</surname><given-names>S</given-names> </name><name name-style="western"><surname>Suppakitjanusant</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lomprew</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kasemkosin</surname><given-names>N</given-names> </name><name name-style="western"><surname>Chailurkit</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ongphiphadhanakul</surname><given-names>B</given-names> </name></person-group><article-title>Instrumental acoustic voice characteristics in adults with type 2 diabetes</article-title><source>J Voice</source><year>2021</year><month>01</month><volume>35</volume><issue>1</issue><fpage>116</fpage><lpage>121</lpage><pub-id pub-id-type="doi">10.1016/j.jvoice.2019.07.003</pub-id><pub-id pub-id-type="medline">31427120</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>G&#x00F6;la&#x00E7;</surname><given-names>H</given-names> </name><name name-style="western"><surname>Atalik</surname><given-names>G</given-names> </name><name name-style="western"><surname>T&#x00FC;rkcan</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Yilmaz</surname><given-names>M</given-names> </name></person-group><article-title>Disease related changes in vocal parameters of patients with type 2 diabetes mellitus</article-title><source>Logoped Phoniatr Vocol</source><year>2022</year><month>10</month><volume>47</volume><issue>3</issue><fpage>202</fpage><lpage>208</lpage><pub-id pub-id-type="doi">10.1080/14015439.2021.1917653</pub-id><pub-id pub-id-type="medline">33970753</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Chitkara</surname><given-names>D</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>RK</given-names> </name></person-group><article-title>Voice based detection of type 2 diabetes mellitus</article-title><conf-name>2016 2nd International Conference on Advances in Electrical, Electronics, Information, Communication and Bio-Informatics (AEEICB)</conf-name><conf-date>Feb 27-28, 2016</conf-date><conf-loc>Chennai, India</conf-loc><fpage>83</fpage><lpage>87</lpage><pub-id pub-id-type="doi">10.1109/AEEICB.2016.7538402</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaufman</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jeon</surname><given-names>J</given-names> </name><name name-style="western"><surname>Oreskovic</surname><given-names>J</given-names> </name><name name-style="western"><surname>Fossat</surname><given-names>Y</given-names> </name></person-group><article-title>Linear effects of glucose levels on voice fundamental frequency in type 2 diabetes and individuals with normoglycemia</article-title><source>Sci Rep</source><year>2024</year><month>08</month><day>28</day><volume>14</volume><issue>1</issue><fpage>19012</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-69620-z</pub-id><pub-id pub-id-type="medline">39198592</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oreskovic</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kaufman</surname><given-names>J</given-names> </name><name name-style="western"><surname>Fossat</surname><given-names>Y</given-names> </name></person-group><article-title>Impact of audio data compression on feature extraction for vocal biomarker detection: validation study</article-title><source>JMIR Biomed Eng</source><year>2024</year><month>04</month><day>15</day><volume>9</volume><fpage>e56246</fpage><pub-id pub-id-type="doi">10.2196/56246</pub-id><pub-id pub-id-type="medline">38875677</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaufman</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Thommandram</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fossat</surname><given-names>Y</given-names> </name></person-group><article-title>Acoustic analysis and prediction of type 2 diabetes mellitus using smartphone-recorded voice segments</article-title><source>Mayo Clin Proc Digit Health</source><year>2023</year><month>12</month><volume>1</volume><issue>4</issue><fpage>534</fpage><lpage>544</lpage><pub-id pub-id-type="doi">10.1016/j.mcpdig.2023.08.005</pub-id><pub-id pub-id-type="medline">40206319</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>2. Classification and diagnosis of diabetes: standards of medical care in diabetes-2022</article-title><source>Diabetes Care</source><year>2022</year><month>01</month><day>1</day><volume>45</volume><issue>Suppl 1</issue><fpage>S17</fpage><lpage>S38</lpage><pub-id pub-id-type="doi">10.2337/dc22-S002</pub-id><pub-id pub-id-type="medline">34964875</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eton</surname><given-names>DT</given-names> </name><name name-style="western"><surname>Yost</surname><given-names>KJ</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>JS</given-names> </name><etal/></person-group><article-title>Development and validation of the patient experience with treatment and self-management (PETS): a patient-reported measure of treatment burden</article-title><source>Qual Life Res</source><year>2017</year><month>02</month><volume>26</volume><issue>2</issue><fpage>489</fpage><lpage>503</lpage><pub-id pub-id-type="doi">10.1007/s11136-016-1397-0</pub-id><pub-id pub-id-type="medline">27566732</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jannoo</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Mamode Khan</surname><given-names>N</given-names> </name></person-group><article-title>Medication adherence and diabetes self-care activities among patients with type 2 diabetes mellitus</article-title><source>Value Health Reg Issues</source><year>2019</year><month>05</month><volume>18</volume><fpage>30</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1016/j.vhri.2018.06.003</pub-id><pub-id pub-id-type="medline">30419448</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sloan</surname><given-names>FA</given-names> </name><name name-style="western"><surname>Yashkin</surname><given-names>AP</given-names> </name></person-group><article-title>Adherence to diabetes guidelines for screening, physical activity and medication and onset of complications and death</article-title><source>J Diabetes Complications</source><year>2015</year><volume>29</volume><issue>8</issue><fpage>1228</fpage><lpage>1233</lpage><pub-id pub-id-type="doi">10.1016/j.jdiacomp.2015.07.005</pub-id><pub-id pub-id-type="medline">26316423</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>C</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Relationship between self-care compliance, trust, and satisfaction among hypertensive patients in China</article-title><source>Front Public Health</source><year>2022</year><volume>10</volume><fpage>1085047</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2022.1085047</pub-id><pub-id pub-id-type="medline">36743158</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mogre</surname><given-names>V</given-names> </name><name name-style="western"><surname>Abanga</surname><given-names>ZO</given-names> </name><name name-style="western"><surname>Tzelepis</surname><given-names>F</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Paul</surname><given-names>C</given-names> </name></person-group><article-title>Adherence to and factors associated with self-care behaviours in type 2 diabetes patients in Ghana</article-title><source>BMC Endocr Disord</source><year>2017</year><month>03</month><day>24</day><volume>17</volume><issue>1</issue><fpage>20</fpage><pub-id pub-id-type="doi">10.1186/s12902-017-0169-3</pub-id><pub-id pub-id-type="medline">28340613</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Heald</surname><given-names>SLM</given-names> </name><name name-style="western"><surname>Nusbaum</surname><given-names>HC</given-names> </name></person-group><article-title>Variability in vowel production within and between days</article-title><source>PLoS ONE</source><year>2015</year><volume>10</volume><issue>9</issue><fpage>e0136791</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0136791</pub-id><pub-id pub-id-type="medline">26331478</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pierce</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Tanner</surname><given-names>K</given-names> </name><name name-style="western"><surname>Merrill</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Shnowske</surname><given-names>L</given-names> </name><name name-style="western"><surname>Roy</surname><given-names>N</given-names> </name></person-group><article-title>Acoustic variability in the healthy female voice within and across days: how much and why?</article-title><source>J Speech Lang Hear Res</source><year>2021</year><month>08</month><day>9</day><volume>64</volume><issue>8</issue><fpage>3015</fpage><lpage>3031</lpage><pub-id pub-id-type="doi">10.1044/2021_JSLHR-21-00018</pub-id><pub-id pub-id-type="medline">34269598</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Methods for optimizing voice recording quantity and settings for enhanced model accuracy.</p><media xlink:href="biomedeng_v10i1e64357_app1.docx" xlink:title="DOCX File, 15 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Number of daily voice recordings per participant.</p><media xlink:href="biomedeng_v10i1e64357_app2.docx" xlink:title="DOCX File, 135 KB"/></supplementary-material></app-group></back></article>