<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMBE</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Biomed Eng</journal-id>
      <journal-title>JMIR Biomedical Engineering</journal-title>
      <issn pub-type="epub">2561-3278</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v5i1e20506</article-id>
      <article-id pub-id-type="pmid"/>
      <article-id pub-id-type="doi">10.2196/20506</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Interpretation of Maturity-Onset Diabetes of the Young Genetic Variants Based on American College of Medical Genetics and Genomics Criteria: Machine-Learning Model Development</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Kukafka</surname>
            <given-names>Rita</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Doogan</surname>
            <given-names>Caitlin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Palmieri</surname>
            <given-names>Flavio</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Yichuan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1899-2082</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Qu</surname>
            <given-names>Hui-Qi</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9317-4488</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Wenocur</surname>
            <given-names>Adam S</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9491-0678</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Qu</surname>
            <given-names>Jingchun</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1974-2496</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Chang</surname>
            <given-names>Xiao</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0230-0416</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Glessner</surname>
            <given-names>Joseph</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5131-2811</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Sleiman</surname>
            <given-names>Patrick</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9874-8532</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Tian</surname>
            <given-names>Lifeng</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1880-5811</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Hakonarson</surname>
            <given-names>Hakon</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Applied Genomics</institution>
            <institution>Children's Hospital of Philadelphia</institution>
            <addr-line>3615 Civic Center Blvd</addr-line>
            <addr-line>Philadelphia, PA, 19104</addr-line>
            <country>United States</country>
            <phone>1 267 426 0088</phone>
            <fax>1 267 426 0363</fax>
            <email>hakonarson@email.chop.edu</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2814-7461</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Applied Genomics</institution>
        <institution>Children's Hospital of Philadelphia</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Texas A&amp;M University</institution>
        <addr-line>College Station, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Human Genetics</institution>
        <institution>Children's Hospital of Philadelphia</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Division of Human Genetics, Department of Pediatrics</institution>
        <institution>The Perelman School of Medicine</institution>
        <institution>University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hakon Hakonarson <email>hakonarson@email.chop.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jan-Dec</season>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>1</day>
        <month>12</month>
        <year>2020</year>
      </pub-date>
      <volume>5</volume>
      <issue>1</issue>
      <elocation-id>e20506</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>5</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>22</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>19</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>3</day>
          <month>11</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Yichuan Liu, Hui-Qi Qu, Adam S Wenocur, Jingchun Qu, Xiao Chang, Joseph Glessner, Patrick Sleiman, Lifeng Tian, Hakon Hakonarson. Originally published in JMIR Biomedical Engineering (http://biomedeng.jmir.org), 01.12.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Biomedical Engineering, is properly cited. The complete bibliographic information, a link to the original publication on http://biomedeng.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://biomedeng.jmir.org/2020/1/e20506/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Maturity-onset diabetes of the young (MODY) is a group of dominantly inherited monogenic diabetes, with <italic>HNF4A</italic>-MODY, <italic>GCK</italic>-MODY, and <italic>HNF1A</italic>-MODY as the three most common forms based on the causal genes. Molecular diagnosis of MODY is important for precise treatment. Although a DNA variant causing MODY can be assessed based on the criteria of the American College of Medical Genetics and Genomics (ACMG) guidelines, gene-specific assessment of disease-causing mutations is important to differentiate among MODY subtypes. As the ACMG criteria were not originally designed for machine-learning algorithms, they are not true independent variables.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to develop machine-learning models for interpretation of DNA variants and MODY diagnosis using the ACMG criteria.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We applied machine-learning models for interpretation of DNA variants in MODY genes defined by the ACMG criteria based on the Human Gene Mutation Database (HGMD) and ClinVar database.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>With a machine-learning procedure, we found that the weight matrix of the ACMG criteria was significantly different between the three MODY genes <italic>HNF1A</italic>, <italic>HNF4A</italic>, and <italic>GCK</italic>. The models showed high predictive abilities with accuracy over 95%.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our results highlight the need for applying different weights of the ACMG criteria in relation to different MODY genes for accurate functional classification. As proof of principle, we applied the ACMG criteria as feature vectors in a machine-learning model and obtained a precision-based result.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>genetics</kwd>
        <kwd>genomics</kwd>
        <kwd>machine learning</kwd>
        <kwd>medicine</kwd>
        <kwd>maturity-onset diabetes of the young</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Monogenic diabetes results from DNA mutations in a single gene, which accounts for about 1%-4% of all cases of diabetes in the United States [<xref ref-type="bibr" rid="ref1">1</xref>]. The most common form of monogenic diabetes is maturity-onset diabetes of the young (MODY), an autosomal dominant disease that most commonly occurs in adolescence or early adulthood [<xref ref-type="bibr" rid="ref2">2</xref>]. Genetic sequencing is needed to identify the causal mutations and to diagnose different subtypes of MODYs [<xref ref-type="bibr" rid="ref3">3</xref>]. The DNA variant causing MODY can be specifically assessed using the criteria established by the American College of Medical Genetics and Genomics (ACMG), as published in their guidelines [<xref ref-type="bibr" rid="ref4">4</xref>]. Although the ACMG guidelines can be universally applied for all human DNA variants, our previous study suggested that a gene-specific assessment is important for identifying disease-causing mutations in different MODY genes [<xref ref-type="bibr" rid="ref5">5</xref>]. In addition, contradictory evidence is commonly seen in functional classification of genetic variations when using the ACMG guidelines [<xref ref-type="bibr" rid="ref6">6</xref>]. The ACMG guidelines may suggest a variant of uncertain significance; however, classification of the variant may have contradictory evidence, and some variants with contradictory evidence may turn out to have a reliable definite classification.</p>
      <p>Machine learning has been advocated as an important tool for both clinical and research purposes in human diseases [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. In this study, we aimed to develop machine-learning models for interpretation of DNA variants using the ACMG criteria, with a focus on DNA variants of three MODY genes (<italic>HNF1A</italic>, <italic>HNF4A</italic>, and <italic>GCK</italic>) underlying the three most common types of MODYs [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection for Machine-Learning Procedures</title>
        <p>Known DNA variants of the three MODY genes <italic>HNF1A</italic>, <italic>HNF4A</italic>, and <italic>GCK</italic> were acquired from the dbSNP [<xref ref-type="bibr" rid="ref10">10</xref>], the ClinVar database [<xref ref-type="bibr" rid="ref11">11</xref>], and the Human Gene Mutation Database (HGMD) 2019 professional version [<xref ref-type="bibr" rid="ref12">12</xref>]. Among the multihundred variants reported in these genes, approximately half have a classification of pathogenic/likely pathogenic (P/LP) according to the annotation in ClinVar or HGMD. According to the HGMD, the three genes were curated by Professor Andrew Hattersley, a leading genetic expert in MODYs [<xref ref-type="bibr" rid="ref13">13</xref>]. The classification of variants as benign/likely benign (B/LB) varies between the different databases according to the annotation of ClinVar or dbSNP. Overall, for the three genes, there are 899 unique variants reported in <italic>HNF1A</italic>, including 569 P/LP sites and 330 B/LB sites; 1037 unique variants for <italic>HNF4A</italic>, including 182 P/LP sites and 855 B/LB sites; and 1664 unique variants for <italic>GCK</italic>, including 1065 P/LP sites and 599 B/LB sites. However, several of these variants have different annotation features between the different databases.</p>
      </sec>
      <sec>
        <title>Feature Vector Generation</title>
        <p>The feature vectors used for machine-learning modeling were the criteria based on the ACMG guidelines [<xref ref-type="bibr" rid="ref14">14</xref>]. The criteria terms were generated based on InterVar [<xref ref-type="bibr" rid="ref15">15</xref>], a computational tool that uses a preannotated or variant call format file as an input and generates automated interpretation based on the ACMG criteria. It should be noted that not all 33 ACMG criteria can be computationally scored. For example, the PS3 criterion requires well-established in vitro or in vivo functional studies supportive of a damaging effect on the gene or gene product. As a result, the following 15 ACMG criteria were used, which was also the length of feature vectors for the three MODY genes: PVS1, PS1, PS4, PM1, PM2, PM4, PM5, PP2, PP3, PP5, BA1, BS1, BP4, BP6, and BP7.</p>
        <p>Using machine-learning regression procedures, we normalized the weights for the evidence of different categories in accordance with the ACMG guidelines, assuming that the weight coefficient of PVS1 is 1, that of PS is 1/2, that of PM is 1/6, and that of PP is 1/12. We additionally assumed that the weight coefficient of BA1, BS, and BP is –1, –1/2, and –1/4, respectively. As the ACMG criteria were not originally designed for machine learning, these criteria are not true independent variables. Multicollinearity among feature vectors is commonly seen within each gene, which is the case for the PM1 and PP2 criteria. By definition, a PM1 hit means that the variant is located in a mutational hotspot or in a critical and well-established functional domain without benign variation, and a PP2 hit means that there is a missense variant in a gene that has a low rate of benign missense variation and in which missense variants are a common mechanism of disease. In many situations, PM1 and PP2 are consistent with each other, which increases the risk of inappropriate weighting of the two criteria because of multicollinearity. To detect the collinearity among feature vectors, we calculated the variance inflation factor (VIF) and pairwise correlation coefficient for the ACMG criteria. Feature vectors with a VIF greater than 10 or a correlation coefficient larger than 0.8 were removed before the learning procedures.</p>
      </sec>
      <sec>
        <title>Learning Procedures and Predictive Modeling</title>
        <p>The machine-learning procedure used in this study was a typical logistic regression based on the Scikit-learn package in Python [<xref ref-type="bibr" rid="ref16">16</xref>]. For detection of the weight matrix of the ACMG criteria, all variants, including P/LP and B/LB variants, were taken into account. For predictive modeling, we split the data based on 2-fold random shuffle processes. In other words, the P/LP and B/LB variants were split randomly into equally sized sets, with one set serving as training data and the other set serving as testing data, to determine the predictive capabilities of the model. This process was repeated 20 times to obtain the mean and standard deviation for accuracy measures, including sensitivity and specificity.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Variation in the Weight Matrix of ACMG Criteria Among the Three MODY Genes</title>
        <p>Based on the machine-learning procedure, we found that the weight matrix of the ACMG criteria was significantly different between the three MODY genes <italic>HNF1A</italic>, <italic>HNF4A,</italic> and <italic>GCK</italic> (<xref ref-type="table" rid="table1">Table 1</xref>, <xref rid="figure1" ref-type="fig">Figure 1</xref>). The differences are nontrivial and must be taken into consideration in clinical interpretation of DNA variants for genetic diagnosis.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Weight matrix of the American College of Medical Genetics and Genomics criteria for three maturity-onset diabetes of the young genes.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Criteria</td>
                <td colspan="6">Frequency</td>
                <td colspan="3">Weight</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td><italic>HNF1A</italic> P/LP<sup>a</sup></td>
                <td><italic>HNF1A</italic> B/LB<sup>b</sup></td>
                <td><italic>HNF4A</italic> P/LP</td>
                <td><italic>HNF4A</italic> B/LB</td>
                <td><italic>GCK</italic> P/LP</td>
                <td><italic>GCK</italic> B/LB</td>
                <td>
                  <italic>HNF1A</italic>
                </td>
                <td>
                  <italic>HNF4A</italic>
                </td>
                <td>
                  <italic>GCK</italic>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>PVS1</td>
                <td>0.3040</td>
                <td>0.0030</td>
                <td>0.2582</td>
                <td>0.0000</td>
                <td>0.2183</td>
                <td>0.0033</td>
                <td>5.401</td>
                <td>11.665</td>
                <td>5.275</td>
              </tr>
              <tr valign="top">
                <td>PS1</td>
                <td>0.0018</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.0039</td>
                <td>0.0000</td>
                <td>0.018</td>
                <td>0.000</td>
                <td>0.210</td>
              </tr>
              <tr valign="top">
                <td>PS4</td>
                <td>0.0000</td>
                <td>0.0030</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.000</td>
                <td>0.000</td>
                <td>0.000</td>
              </tr>
              <tr valign="top">
                <td>PM1</td>
                <td>0.5149</td>
                <td>0.0030</td>
                <td>0.4835</td>
                <td>0.0000</td>
                <td>0.6326</td>
                <td>0.0083</td>
                <td>0.866</td>
                <td>2.340</td>
                <td>0.442</td>
              </tr>
              <tr valign="top">
                <td>PM2</td>
                <td>0.9772</td>
                <td>0.4273</td>
                <td>0.7802</td>
                <td>0.1450</td>
                <td>0.9922</td>
                <td>0.5092</td>
                <td>0.555</td>
                <td>0.290</td>
                <td>0.542</td>
              </tr>
              <tr valign="top">
                <td>PM4</td>
                <td>0.0053</td>
                <td>0.0000</td>
                <td>0.0055</td>
                <td>0.0000</td>
                <td>0.0049</td>
                <td>0.0000</td>
                <td>1.167</td>
                <td>1.944</td>
                <td>0.923</td>
              </tr>
              <tr valign="top">
                <td>PM5</td>
                <td>0.0264</td>
                <td>0.0000</td>
                <td>0.0055</td>
                <td>0.0000</td>
                <td>0.1335</td>
                <td>0.0000</td>
                <td>0.375</td>
                <td>0.007</td>
                <td>0.927</td>
              </tr>
              <tr valign="top">
                <td>PP2</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.5440</td>
                <td>0.0012</td>
                <td>0.0000</td>
                <td>0.0000</td>
                <td>0.000</td>
                <td>0.000</td>
                <td>0.000</td>
              </tr>
              <tr valign="top">
                <td>PP3</td>
                <td>0.6151</td>
                <td>0.0061</td>
                <td>0.5769</td>
                <td>0.0000</td>
                <td>0.7437</td>
                <td>0.0050</td>
                <td>0.235</td>
                <td>0.000</td>
                <td>0.347</td>
              </tr>
              <tr valign="top">
                <td>PP5</td>
                <td>0.1195</td>
                <td>0.0000</td>
                <td>0.1923</td>
                <td>0.0000</td>
                <td>0.1540</td>
                <td>0.0033</td>
                <td>0.975</td>
                <td>1.727</td>
                <td>0.202</td>
              </tr>
              <tr valign="top">
                <td>BA1</td>
                <td>0.0105</td>
                <td>0.2091</td>
                <td>0.0165</td>
                <td>0.1708</td>
                <td>0.0039</td>
                <td>0.1703</td>
                <td>-0.696</td>
                <td>–0.880</td>
                <td>–1.312</td>
              </tr>
              <tr valign="top">
                <td>BS1</td>
                <td>0.0228</td>
                <td>0.5667</td>
                <td>0.0440</td>
                <td>0.5895</td>
                <td>0.0078</td>
                <td>0.4891</td>
                <td>0.000</td>
                <td>0.000</td>
                <td>0.000</td>
              </tr>
              <tr valign="top">
                <td>BP4</td>
                <td>0.0193</td>
                <td>0.0727</td>
                <td>0.0165</td>
                <td>0.0222</td>
                <td>0.0458</td>
                <td>0.0234</td>
                <td>0.000</td>
                <td>0.000</td>
                <td>–0.665</td>
              </tr>
              <tr valign="top">
                <td>BP6</td>
                <td>0.0123</td>
                <td>0.1182</td>
                <td>0.0220</td>
                <td>0.0480</td>
                <td>0.0029</td>
                <td>0.0234</td>
                <td>0.000</td>
                <td>0.000</td>
                <td>–0.253</td>
              </tr>
              <tr valign="top">
                <td>BP7</td>
                <td>0.0123</td>
                <td>0.0636</td>
                <td>0.0110</td>
                <td>0.0211</td>
                <td>0.0400</td>
                <td>0.0200</td>
                <td>0.000</td>
                <td>0.000</td>
                <td>0.000</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>P/LP: pathogenic/likely pathogenic variant.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>B/LB: benign/likely benign variant.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Weight matrix of three MODY genes, HNF1A, HNF4A and GCK: normalized weight for American College of Medical Genetics and Genomics criteria for three most common maturity-onset diabetes of the young genes.</p>
          </caption>
          <graphic xlink:href="biomedeng_v5i1e20506_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Evidence for PS is rarely observed for the MODY variants. By contrast, evidence for PS4 (ie, the prevalence of the variant in affected individuals is significantly increased compared with the prevalence in controls) is commonly observed but is often misclassified. As an example, the <italic>HNF1A</italic> variant 12:121420807-G-A (rs1183910) was reported to be associated with C-reactive protein, a marker of inflammation, in a genome-wide association study [<xref ref-type="bibr" rid="ref17">17</xref>]. However, as a common single nucleotide polymorphism with a minor allele frequency of 0.292 in European populations, this cannot be a variant causing the rare and dominantly inherited form of <italic>HNF1A</italic>-MODY.</p>
        <p>With respect to evidence for PM criteria, PM1, which is defined as a variant located in a mutational hotspot or in a critical and well-established functional domain (eg, active site of an enzyme) without benign variation, and PM2 (absent from controls or at extremely low frequency if recessive in Exome Sequencing Project, 1000 Genomes Project, or Exome Aggregation Consortium) are both commonly observed, in support of pathogenic variants in the three MODY genes. However, PM2 is also commonly seen among B/LB variants in these three genes, thus lacking specificity for functional classification. In this study, PM2 showed a VIF of 79.0 in <italic>HNF1A</italic> and a VIF of 247 in <italic>GCK</italic>. Therefore, although PM2 is much more common than PM1 for the three MODY genes, the weight of PM2 in <italic>HNF1A</italic> is lower than that of PM1.</p>
        <p>With respect to the evidence for PP criteria, PP2 (missense variant in a gene that has a low rate of benign missense variation and in which missense variants are a common mechanism of disease) is absent in <italic>HNF1A</italic> and <italic>GCK</italic>, but is commonly seen in <italic>HNF4A</italic>. However, PP2 showed a correlation coefficient of 0.932 with PM1, and therefore does not add substantial weight to the classification of P/LP variants in <italic>HNF4A</italic>.</p>
      </sec>
      <sec>
        <title>Highly Accurate Predictive Ability for MODY Gene Pathogenicity</title>
        <p><italic>HNF4A</italic>-MODY (MODY1), <italic>GCK</italic>-MODY (MODY2), and <italic>HNF1A</italic>-MODY (MODY3) are the three most common types of MODYs, accounting for ~70% of all MODY genes [<xref ref-type="bibr" rid="ref18">18</xref>]. Therefore, a predictive model that can accurately recognize pathogenic variants would be useful for the diagnosis of novel mutations in these genes. As described in the Methods section, we used 2-fold random shuffle testing with 50% of the 3600 mutations as training data and the other 50% as testing data, and repeated the analysis 20 times. The logistic regression machine-learning model showed overall accuracy above 95% (1676/1786) for MODY gene mutations (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Both <italic>HNF1A</italic> (true negatives=163, false positives=2) and <italic>HNF4A</italic> (true negatives=428, false positives=0) had a specificity close to 100%, and the specificity in <italic>GCK</italic> was also above 95% (true negatives=289, false positives=10). This lower specificity is also consistent with the benign phenotype and mild clinical expression of <italic>GCK</italic>-MODY.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Overall accuracy based on logistic regression machine learning. The boxplot represents the sensitivity and specificity for 2-fold random shuffle tests.</p>
          </caption>
          <graphic xlink:href="biomedeng_v5i1e20506_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>These results proved the principle that ACMG criteria could be applied as meaningful feature vectors in a machine-learning model, and such a model based on ACMG criteria could provide accurate pathogenic classification for other Mendelian disease genes in a gene-specific manner.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>Our results highlight the need for applying different weights of the ACMG criteria in the functional classification of DNA variants of different MODY genes. In the past decade, sequencing technologies have evolved rapidly with the advance of high-throughput next-generation sequencing (NGS). By adopting NGS, clinical laboratories are now performing an ever-increasing volume of genetic testing for genetic disorders. However, increased complexity in genetic testing has been accompanied by new challenges in sequence interpretation, and multiple new standards have been implemented for physicians and genetic counselors regarding the interpretation and reporting of sequence variants at different levels of pathogenicity. Currently, there are multiple computational tools available based on different algorithms and databases that are being used to predict the pathogenicity of DNA variants, such as SIFT [<xref ref-type="bibr" rid="ref19">19</xref>], MutationTaster [<xref ref-type="bibr" rid="ref20">20</xref>], likelihood ratio test [<xref ref-type="bibr" rid="ref21">21</xref>], FATHMM by a supervised machine-learning model [<xref ref-type="bibr" rid="ref22">22</xref>], GERP++ by maximum-likelihood evolutionary rate estimation [<xref ref-type="bibr" rid="ref23">23</xref>] for coding variants, and DANN for both coding and noncoding variants using a deep neural network [<xref ref-type="bibr" rid="ref24">24</xref>]. However, all of these computational tools assess each gene with a common rule, which is not based on biology, whereas this study proposes that a gene-specific assessment for pathogenicity is required, at least for MODY genes [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      <p>The evolutionary selection pressures on MODYs vary across different genes, and is considered to be the lowest in the case of <italic>GCK</italic>-MODY [<xref ref-type="bibr" rid="ref25">25</xref>]. Similar issues exist with functional classification based on the ACMG criteria, which are globally applied for all human genes. The ACMG criteria contain 33 terms that lead to five categories of mutations (“pathogenic,” “likely pathogenic,” “uncertain significance,” “likely benign,” and “benign”), as one of the most commonly used standards.</p>
      <p>MODY represents a group of dominantly inherited monogenic diabetes, and <italic>HNF4A</italic>-MODY (MODY1), <italic>GCK</italic>-MODY (MODY2), and <italic>HNF1A</italic>-MODY (MODY3) are the three most common subtypes of MODY. These MODY genes are involved in different molecular pathways. MODY variants of different genes show different clinical features and thus require different treatments. For example, <italic>HNF1A</italic>-MODY is characterized by a reduced beta cell mass or impaired function, and has been treated with sulfonylureas for decades with excellent results [<xref ref-type="bibr" rid="ref26">26</xref>]. Patients with <italic>HNF1A</italic>-MODY are highly sensitive to sulfonylurea treatment and may be susceptible to developing hypoglycemia during the treatment [<xref ref-type="bibr" rid="ref26">26</xref>]. <italic>HNF4A</italic>-MODY has similar clinical features with <italic>HNF1A</italic>-MODY, and the affected transcription network plays a role in the early development of the pancreas. The pancreatic beta cells produce adequate insulin in infancy but the capacity for insulin production declines thereafter [<xref ref-type="bibr" rid="ref27">27</xref>]. The beta cells in <italic>GCK</italic>-MODY have a normal capacity to make and secrete insulin, but do so only above an abnormally high glucose threshold, which results in a chronic, mild increase in blood sugar that is usually asymptomatic [<xref ref-type="bibr" rid="ref25">25</xref>]. Accordingly, treatment of <italic>GCK</italic>-MODY can be achieved by a healthy diet and exercise, while oral hypoglycemic agents or insulin is of no benefit for these patients [<xref ref-type="bibr" rid="ref25">25</xref>]. Therefore, accurate molecular diagnosis of these MODYs is important for precise treatment.</p>
      <p>In conclusion, we applied a computational machine-learning method together with the ACMG criteria for functional classification of genetic variants of the three most common MODY genes, <italic>HNF1A</italic>, <italic>HNF4A</italic> and <italic>GCK.</italic> Our results show that a typical machine-learning model using 15 computational ACMG criteria as the feature vector has predictive abilities that are highly accurate (&gt;95% accuracy) for hundreds of annotated variants in three MODY genes. Therefore, this model could serve as a fast, gene-specific method for physicians or genetic counselors assisting with diagnosis and reporting, especially when confronted by contradictory ACMG criteria. Moreover, we show that the weight of the ACMG criteria exhibits gene specificity, which advocates for the application of machine-learning methods with the ACMG criteria to capture the most relevant information for each disease-related variant.</p>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACMG</term>
          <def>
            <p>American College of Medical Genetics and Genomics</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">B/LB</term>
          <def>
            <p>benign/likely benign</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HGMD</term>
          <def>
            <p>Human Gene Mutation Database</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MODY</term>
          <def>
            <p>maturity-onset diabetes of the young</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NGS</term>
          <def>
            <p>next-generation sequencing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">P/LP</term>
          <def>
            <p>pathogenic/likely pathogenic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">VIF</term>
          <def>
            <p>variance inflation factor</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The study was supported by Institutional Development Funds from the Children’s Hospital of Philadelphia to the Center for Applied Genomics, and The Children’s Hospital of Philadelphia Endowed Chair in Genomic Research to HH. We thank the Center for Applied Genomics staff and support from Children’s Hospital of Philadelphia.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>YL and HQ conceptualized and designed the study, drafted the initial manuscript, and reviewed and revised the manuscript. AW, JQ, XC, JG, PS, and LT collected data, carried out the initial analyses, and reviewed and revised the manuscript. HH conceptualized and designed the study, and critically reviewed the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>National Institute of Diabetes and Digestive and Kidney Diseases</source>
          <access-date>2020-05-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.niddk.nih.gov/health-information/diabetes/overview/what-is-diabetes/monogenic-neonatal-mellitus-mody">https://www.niddk.nih.gov/health-information/diabetes/overview/what-is-diabetes/monogenic-neonatal-mellitus-mody</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shields</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Hicks</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shepherd</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Colclough</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hattersley</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Ellard</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Maturity-onset diabetes of the young (MODY): how many cases are we missing?</article-title>
          <source>Diabetologia</source>
          <year>2010</year>
          <month>12</month>
          <day>25</day>
          <volume>53</volume>
          <issue>12</issue>
          <fpage>2504</fpage>
          <lpage>2508</lpage>
          <pub-id pub-id-type="doi">10.1007/s00125-010-1799-4</pub-id>
          <pub-id pub-id-type="medline">20499044</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rubio-Cabezas</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Hattersley</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Njølstad</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Mlynarski</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ellard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Craig</surname>
              <given-names>ME</given-names>
            </name>
            <collab>International Society for Pediatric Adolescent Diabetes</collab>
          </person-group>
          <article-title>ISPAD Clinical Practice Consensus Guidelines 2014. The diagnosis and management of monogenic diabetes in children and adolescents</article-title>
          <source>Pediatr Diabetes</source>
          <year>2014</year>
          <month>09</month>
          <day>03</day>
          <volume>15</volume>
          <issue>Suppl 20</issue>
          <fpage>47</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1111/pedi.12192</pub-id>
          <pub-id pub-id-type="medline">25182307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Richards</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aziz</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bale</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bick</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gastier-Foster</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grody</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Hegde</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lyon</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Spector</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Voelkerding</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rehm</surname>
              <given-names>HL</given-names>
            </name>
            <collab>ACMG Laboratory Quality Assurance Committee</collab>
          </person-group>
          <article-title>Standards and guidelines for the interpretation of sequence variants: a joint consensus recommendation of the American College of Medical Genetics and Genomics and the Association for Molecular Pathology</article-title>
          <source>Genet Med</source>
          <year>2015</year>
          <month>05</month>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>405</fpage>
          <lpage>424</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25741868"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/gim.2015.30</pub-id>
          <pub-id pub-id-type="medline">25741868</pub-id>
          <pub-id pub-id-type="pii">gim201530</pub-id>
          <pub-id pub-id-type="pmcid">PMC4544753</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbs</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Boerwinkle</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Polychronakos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Gene-specific function prediction for non-synonymous mutations in monogenic diabetes genes</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e104452</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0104452"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0104452</pub-id>
          <pub-id pub-id-type="medline">25136813</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-22072</pub-id>
          <pub-id pub-id-type="pmcid">PMC4138110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hakonarson</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Application of ACMG criteria to classify variants in the human gene mutation database</article-title>
          <source>J Hum Genet</source>
          <year>2019</year>
          <month>11</month>
          <day>26</day>
          <volume>64</volume>
          <issue>11</issue>
          <fpage>1091</fpage>
          <lpage>1095</lpage>
          <pub-id pub-id-type="doi">10.1038/s10038-019-0663-8</pub-id>
          <pub-id pub-id-type="medline">31451714</pub-id>
          <pub-id pub-id-type="pii">10.1038/s10038-019-0663-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Phung</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karmakar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shilton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yearwood</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dimitrova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Venkatesh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berk</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Guidelines for Developing and Reporting Machine Learning Predictive Models in Biomedical Research: A Multidisciplinary View</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>12</month>
          <day>16</day>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/12/e323/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id>
          <pub-id pub-id-type="medline">27986644</pub-id>
          <pub-id pub-id-type="pii">v18i12e323</pub-id>
          <pub-id pub-id-type="pmcid">PMC5238707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pande</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mohapatra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nicorici</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Machine Learning to Improve Energy Expenditure Estimation in Children With Disabilities: A Pilot Study in Duchenne Muscular Dystrophy</article-title>
          <source>JMIR Rehabil Assist Technol</source>
          <year>2016</year>
          <month>07</month>
          <day>19</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>e7</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://rehab.jmir.org/2016/2/e7/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/rehab.4340</pub-id>
          <pub-id pub-id-type="medline">28582264</pub-id>
          <pub-id pub-id-type="pii">v3i2e7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5454548</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pihoker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gilliam</surname>
              <given-names>LK</given-names>
            </name>
            <name name-style="western">
              <surname>Ellard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dabelea</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dolan</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Greenbaum</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Imperatore</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrence</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Marcovina</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer-Davis</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Steck</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Hattersley</surname>
              <given-names>AT</given-names>
            </name>
            <collab>SEARCH for Diabetes in Youth Study Group</collab>
          </person-group>
          <article-title>Prevalence, characteristics and clinical diagnosis of maturity onset diabetes of the young due to mutations in HNF1A, HNF4A, and glucokinase: results from the SEARCH for Diabetes in Youth</article-title>
          <source>J Clin Endocrinol Metab</source>
          <year>2013</year>
          <month>10</month>
          <volume>98</volume>
          <issue>10</issue>
          <fpage>4055</fpage>
          <lpage>4062</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23771925"/>
          </comment>
          <pub-id pub-id-type="doi">10.1210/jc.2013-1279</pub-id>
          <pub-id pub-id-type="medline">23771925</pub-id>
          <pub-id pub-id-type="pii">jc.2013-1279</pub-id>
          <pub-id pub-id-type="pmcid">PMC3790621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sherry</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Kholodov</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Phan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Smigielski</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Sirotkin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>dbSNP: the NCBI database of genetic variation</article-title>
          <source>Nucleic Acids Res</source>
          <year>2001</year>
          <month>01</month>
          <day>01</day>
          <volume>29</volume>
          <issue>1</issue>
          <fpage>308</fpage>
          <lpage>311</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/11125122"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/29.1.308</pub-id>
          <pub-id pub-id-type="medline">11125122</pub-id>
          <pub-id pub-id-type="pmcid">PMC29783</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Landrum</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Jang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rubinstein</surname>
              <given-names>WS</given-names>
            </name>
            <name name-style="western">
              <surname>Church</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Maglott</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>ClinVar: public archive of relationships among sequence variation and human phenotype</article-title>
          <source>Nucleic Acids Res</source>
          <year>2014</year>
          <month>01</month>
          <volume>42</volume>
          <issue>Database issue</issue>
          <fpage>D980</fpage>
          <lpage>D985</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24234437"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkt1113</pub-id>
          <pub-id pub-id-type="medline">24234437</pub-id>
          <pub-id pub-id-type="pii">gkt1113</pub-id>
          <pub-id pub-id-type="pmcid">PMC3965032</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stenson</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Mort</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hayden</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Heywood</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>DN</given-names>
            </name>
          </person-group>
          <article-title>The Human Gene Mutation Database: towards a comprehensive repository of inherited mutation data for medical research, genetic diagnosis and next-generation sequencing studies</article-title>
          <source>Hum Genet</source>
          <year>2017</year>
          <month>06</month>
          <volume>136</volume>
          <issue>6</issue>
          <fpage>665</fpage>
          <lpage>677</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28349240"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00439-017-1779-6</pub-id>
          <pub-id pub-id-type="medline">28349240</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00439-017-1779-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5429360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <source>Human Gene Mutation Database</source>
          <access-date>2020-05-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.hgmd.cf.ac.uk/docs/new_back.html">http://www.hgmd.cf.ac.uk/docs/new_back.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bahcall</surname>
              <given-names>OG</given-names>
            </name>
          </person-group>
          <article-title>Genetic testing. ACMG guides on the interpretation of sequence variants</article-title>
          <source>Nat Rev Genet</source>
          <year>2015</year>
          <month>05</month>
          <volume>16</volume>
          <issue>5</issue>
          <fpage>256</fpage>
          <lpage>257</lpage>
          <pub-id pub-id-type="doi">10.1038/nrg3940</pub-id>
          <pub-id pub-id-type="medline">25854183</pub-id>
          <pub-id pub-id-type="pii">nrg3940</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>InterVar: Clinical Interpretation of Genetic Variants by the 2015 ACMG-AMP Guidelines</article-title>
          <source>Am J Hum Genet</source>
          <year>2017</year>
          <month>02</month>
          <day>02</day>
          <volume>100</volume>
          <issue>2</issue>
          <fpage>267</fpage>
          <lpage>280</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0002-9297(17)30004-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ajhg.2017.01.004</pub-id>
          <pub-id pub-id-type="medline">28132688</pub-id>
          <pub-id pub-id-type="pii">S0002-9297(17)30004-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5294755</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vincent</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: Machine learning in Python</article-title>
          <source>J Machine Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ligthart</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vaez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>Y</given-names>
            </name>
            <collab>Inflammation Working Group of the CHARGE Consortium</collab>
            <collab>PMI-WG-XCP</collab>
            <collab>LifeLines Cohort Study</collab>
            <name name-style="western">
              <surname>Stolk</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Uitterlinden</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Hofman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alizadeh</surname>
              <given-names>BZ</given-names>
            </name>
            <name name-style="western">
              <surname>Franco</surname>
              <given-names>OH</given-names>
            </name>
            <name name-style="western">
              <surname>Dehghan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Bivariate genome-wide association study identifies novel pleiotropic loci for lipids and inflammation</article-title>
          <source>BMC Genomics</source>
          <year>2016</year>
          <month>06</month>
          <day>10</day>
          <volume>17</volume>
          <fpage>443</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcgenomics.biomedcentral.com/articles/10.1186/s12864-016-2712-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12864-016-2712-4</pub-id>
          <pub-id pub-id-type="medline">27286809</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12864-016-2712-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC4901478</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ellard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bellanné-Chantelot</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hattersley</surname>
              <given-names>AT</given-names>
            </name>
            <collab>European Molecular Genetics Quality Network (EMQN) MODY group</collab>
          </person-group>
          <article-title>Best practice guidelines for the molecular genetic diagnosis of maturity-onset diabetes of the young</article-title>
          <source>Diabetologia</source>
          <year>2008</year>
          <month>04</month>
          <day>23</day>
          <volume>51</volume>
          <issue>4</issue>
          <fpage>546</fpage>
          <lpage>553</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18297260"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00125-008-0942-y</pub-id>
          <pub-id pub-id-type="medline">18297260</pub-id>
          <pub-id pub-id-type="pmcid">PMC2270360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Henikoff</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>SIFT: Predicting amino acid changes that affect protein function</article-title>
          <source>Nucleic Acids Res</source>
          <year>2003</year>
          <month>07</month>
          <day>01</day>
          <volume>31</volume>
          <issue>13</issue>
          <fpage>3812</fpage>
          <lpage>3814</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12824425"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkg509</pub-id>
          <pub-id pub-id-type="medline">12824425</pub-id>
          <pub-id pub-id-type="pmcid">PMC168916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwarz</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Schuelke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Seelow</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>MutationTaster2: mutation prediction for the deep-sequencing age</article-title>
          <source>Nat Methods</source>
          <year>2014</year>
          <month>04</month>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>361</fpage>
          <lpage>362</lpage>
          <pub-id pub-id-type="doi">10.1038/nmeth.2890</pub-id>
          <pub-id pub-id-type="medline">24681721</pub-id>
          <pub-id pub-id-type="pii">nmeth.2890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fay</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Identification of deleterious mutations within three human genomes</article-title>
          <source>Genome Res</source>
          <year>2009</year>
          <month>09</month>
          <volume>19</volume>
          <issue>9</issue>
          <fpage>1553</fpage>
          <lpage>1561</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://genome.cshlp.org/cgi/pmidlookup?view=long&amp;pmid=19602639"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/gr.092619.109</pub-id>
          <pub-id pub-id-type="medline">19602639</pub-id>
          <pub-id pub-id-type="pii">gr.092619.109</pub-id>
          <pub-id pub-id-type="pmcid">PMC2752137</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Shihab</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Mort</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Gaunt</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>FATHMM-XF: accurate prediction of pathogenic point mutations via extended features</article-title>
          <source>Bioinformatics</source>
          <year>2018</year>
          <month>02</month>
          <day>01</day>
          <volume>34</volume>
          <issue>3</issue>
          <fpage>511</fpage>
          <lpage>513</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28968714"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btx536</pub-id>
          <pub-id pub-id-type="medline">28968714</pub-id>
          <pub-id pub-id-type="pii">4104409</pub-id>
          <pub-id pub-id-type="pmcid">PMC5860356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davydov</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Goode</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sirota</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sidow</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Batzoglou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Identifying a high fraction of the human genome to be under selective constraint using GERP++</article-title>
          <source>PLoS Comput Biol</source>
          <year>2010</year>
          <month>12</month>
          <day>02</day>
          <volume>6</volume>
          <issue>12</issue>
          <fpage>e1001025</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pcbi.1001025"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1001025</pub-id>
          <pub-id pub-id-type="medline">21152010</pub-id>
          <pub-id pub-id-type="pmcid">PMC2996323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Quang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>DANN: a deep learning approach for annotating the pathogenicity of genetic variants</article-title>
          <source>Bioinformatics</source>
          <year>2015</year>
          <month>03</month>
          <day>01</day>
          <volume>31</volume>
          <issue>5</issue>
          <fpage>761</fpage>
          <lpage>763</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25338716"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btu703</pub-id>
          <pub-id pub-id-type="medline">25338716</pub-id>
          <pub-id pub-id-type="pii">btu703</pub-id>
          <pub-id pub-id-type="pmcid">PMC4341060</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakera</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Steele</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Gloyn</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Shepherd</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Shields</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ellard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hattersley</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>Recognition and Management of Individuals With Hyperglycemia Because of a Heterozygous Glucokinase Mutation</article-title>
          <source>Diabetes Care</source>
          <year>2015</year>
          <month>07</month>
          <day>23</day>
          <volume>38</volume>
          <issue>7</issue>
          <fpage>1383</fpage>
          <lpage>1392</lpage>
          <pub-id pub-id-type="doi">10.2337/dc14-2769</pub-id>
          <pub-id pub-id-type="medline">26106223</pub-id>
          <pub-id pub-id-type="pii">38/7/1383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Starkey</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Powell</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gribble</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Hattersley</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>Genetic cause of hyperglycaemia and response to treatment in diabetes</article-title>
          <source>Lancet</source>
          <year>2003</year>
          <month>10</month>
          <day>18</day>
          <volume>362</volume>
          <issue>9392</issue>
          <fpage>1275</fpage>
          <lpage>1281</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(03)14571-0</pub-id>
          <pub-id pub-id-type="medline">14575972</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(03)14571-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Odom</surname>
              <given-names>DT</given-names>
            </name>
            <name name-style="western">
              <surname>Zizlsperger</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Rinaldi</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Volkert</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Schreiber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rolfe</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Gifford</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Fraenkel</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>GI</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Control of pancreas and liver gene expression by HNF transcription factors</article-title>
          <source>Science</source>
          <year>2004</year>
          <month>02</month>
          <day>27</day>
          <volume>303</volume>
          <issue>5662</issue>
          <fpage>1378</fpage>
          <lpage>1381</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.sciencemag.org/cgi/pmidlookup?view=long&amp;pmid=14988562"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.1089769</pub-id>
          <pub-id pub-id-type="medline">14988562</pub-id>
          <pub-id pub-id-type="pii">303/5662/1378</pub-id>
          <pub-id pub-id-type="pmcid">PMC3012624</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
