<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JBB</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Bioinformatics Biotechnol</journal-id>
      <journal-title>JMIR Bioinformatics and Biotechnology</journal-title>
      <issn pub-type="epub">2563-3570</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v2i1e25995</article-id>
      <article-id pub-id-type="pmid">33497425</article-id>
      <article-id pub-id-type="doi">10.2196/25995</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Isolating SARS-CoV-2 Strains From Countries in the Same Meridian: Genome Evolutionary Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pappalardo</surname>
            <given-names>Francesco</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Motta</surname>
            <given-names>Santo</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Mastriani</surname>
            <given-names>Emilio</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>HMU-UCCSM Centre for Infection and Genomics</institution>
            <institution>Harbin Medical University</institution>
            <addr-line>No 157, Baojian Road</addr-line>
            <addr-line>Harbin, 150081</addr-line>
            <country>China</country>
            <phone>86 13664502721 ext 64502721</phone>
            <email>emiliomastriani@icloud.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5434-2546</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Rakov</surname>
            <given-names>Alexey V</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1917-9189</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Shu-Lin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6883-6037</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Systemomics Center, College of Pharmacy, Genomics Research Center</institution>
        <institution>State-Province Key Laboratories of Biomedicine-Pharmaceutics of China</institution>
        <institution>Harbin Medical University</institution>
        <addr-line>Harbin</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>HMU-UCCSM Centre for Infection and Genomics</institution>
        <institution>Harbin Medical University</institution>
        <addr-line>Harbin</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Somov Institute of Epidemiology and Microbiology</institution>
        <addr-line>Vladivostok</addr-line>
        <country>Russian Federation</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Microbiology, Immunology and Infectious Diseases</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Emilio Mastriani <email>emiliomastriani@icloud.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jan-Dec</season>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>22</day>
        <month>1</month>
        <year>2021</year>
      </pub-date>
      <volume>2</volume>
      <issue>1</issue>
      <elocation-id>e25995</elocation-id>
      <history>
        <date date-type="received">
          <day>23</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>12</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>12</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>13</day>
          <month>1</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Emilio Mastriani, Alexey V Rakov, Shu-Lin Liu. Originally published in JMIR Bioinformatics and Biotechnology (http://bioinform.jmir.org), 22.01.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Bioinformatics and Biotechnology, is properly cited. The complete bibliographic information, a link to the original publication on http://bioinform.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://bioinform.jmir.org/2021/1/e25995/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>COVID-19, caused by the novel SARS-CoV-2, is considered the most threatening respiratory infection in the world, with over 40 million people infected and over 0.934 million related deaths reported worldwide. It is speculated that epidemiological and clinical features of COVID-19 may differ across countries or continents. Genomic comparison of 48,635 SARS-CoV-2 genomes has shown that the average number of mutations per sample was 7.23, and most SARS-CoV-2 strains belong to one of 3 clades characterized by geographic and genomic specificity: Europe, Asia, and North America.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to compare the genomes of SARS-CoV-2 strains isolated from Italy, Sweden, and Congo, that is, 3 different countries in the same meridian (longitude) but with different climate conditions, and from Brazil (as an outgroup country), to analyze similarities or differences in patterns of possible evolutionary pressure signatures in their genomes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We obtained data from the Global Initiative on Sharing All Influenza Data repository by sampling all genomes available at the time of sampling (May 2020). Using HyPhy, we performed recombination analysis by the genetic algorithm recombination detection method, trimming, removal of the stop codons, and phylogenetic tree and mixed effects model of evolution analyses. We also performed secondary structure prediction analysis for both sequences (mutated and wild-type) and “disorder” and “transmembrane” analyses of the protein. We analyzed both protein structures with an ab initio approach to predict their ontologies and 3D structures.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Evolutionary analysis revealed that codon 9628 is under episodic selective pressure for all SARS-CoV-2 strains isolated from the 4 countries, suggesting it is a key site for virus evolution. Codon 9628 encodes the P0DTD3 (Y14_SARS2) uncharacterized protein 14. Further investigation showed that the codon mutation was responsible for helical modification in the secondary structure. The codon was positioned in the more ordered region of the gene (41-59) and near to the area acting as the transmembrane (54-67), suggesting its involvement in the attachment phase of the virus. The predicted protein structures of both wild-type and mutated P0DTD3 confirmed the importance of the codon to define the protein structure. Moreover, ontological analysis of the protein emphasized that the mutation enhances the binding probability.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our results suggest that RNA secondary structure may be affected and, consequently, the protein product changes T (threonine) to G (glycine) in position 50 of the protein. This position is located close to the predicted transmembrane region. Mutation analysis revealed that the change from G (glycine) to D (aspartic acid) may confer a new function to the protein—binding activity, which in turn may be responsible for attaching the virus to human eukaryotic cells. These findings can help design in vitro experiments and possibly facilitate a vaccine design and successful antiviral strategies.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>SARS-CoV-2</kwd>
        <kwd>evolutionary analysis</kwd>
        <kwd>episodic selective pressure</kwd>
        <kwd>virus evolution</kwd>
        <kwd>codon mutation</kwd>
        <kwd>binding probability</kwd>
        <kwd>evolution</kwd>
        <kwd>genome</kwd>
        <kwd>genetics</kwd>
        <kwd>COVID-19</kwd>
        <kwd>virus</kwd>
        <kwd>strain</kwd>
        <kwd>codon</kwd>
        <kwd>pressure</kwd>
        <kwd>mutation</kwd>
        <kwd>structure</kwd>
        <kwd>prediction</kwd>
        <kwd>protein</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The ongoing COVID-19 pandemic caused by the novel SARS-CoV-2 is the most threatening respiratory infection worldwide and has affected almost every country in the world. As of December 30, 2020, over 81 million people were infected with COVID-19, and more than 1.7 million deaths were reported. Many health institutions are attempting to produce effective vaccines against this virus infection, and several are now in the final stages of development before their application to human populations [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>The SARS-CoV-2 genome shares approximately 82% sequence identity with SARS-CoV and MERS-CoV (Middle East respiratory syndrome coronavirus) and more than 90% sequence identity for essential enzymes and structural proteins. This high level of sequence identity suggests a common pathogenesis mechanism and, thus, therapeutic targeting. SARS-CoV-2 contains 4 structural proteins, including spike (S), envelope (E), membrane (M), and nucleocapsid (N) proteins [<xref ref-type="bibr" rid="ref3">3</xref>]. The structure and the genome of SARS-CoV-2 are being extensively studied, but the results seem to be controversial. For example, a recent study found that the 2 integral membrane proteins (ie, envelope and membrane proteins) tend to evolve slowly by accumulating nucleotide mutations on their corresponding genes, but genes encoding nucleocapsid, viral replicase and spike proteins, which are regarded as important targets for the development of vaccines and antiviral drugs, tend to evolve faster [<xref ref-type="bibr" rid="ref4">4</xref>]. However, other studies have shown that potential drug targets of SARS-CoV-2 are highly conserved [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>The genome of SARS-CoV-2 consists of a single-stranded positive-sense RNA. A newly sequenced genome of SARS-CoV-2 was submitted to the NCBI genome database (NC_045512.2). The genetic makeup of SARS-CoV-2 is composed of 13-15 (including 12 functional) open reading frames (ORFs) containing ~30,000 nucleotides. The genome has a GC content of 38% and contains 11 protein-coding genes, together expressing 12 proteins [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>The genomic characterization of 95 SARS-CoV-2 genomes revealed the 2 most common mutations that might affect the severity and spread of SARS-CoV-2 [<xref ref-type="bibr" rid="ref5">5</xref>]. Another study highlighted the crucial genomic features that are unique to SARS-CoV-2 and 2 other deadly coronaviruses, SARS-CoV and MERS-CoV. These unique features correlate with the high fatality rate due to infection with these coronaviruses as well as their ability to switch hosts from animals to humans [<xref ref-type="bibr" rid="ref6">6</xref>]. As a result, it can be speculated that the epidemiological and clinical features of these viruses may differ across countries or continents.</p>
      <p>Genomic comparison of 48,635 SARS-CoV-2 genomes has shown that the average number of mutations per sample was 7.23, and most SARS-CoV-2 strains belong to one of the following 3 clades characterized by geographic and genomic specificity: clade G (Europe), clade L (Asia), and G-derived clade (North America) [<xref ref-type="bibr" rid="ref7">7</xref>]. These results suggest custom-designed antiviral strategies based on the molecular specificities of SARS-CoV-2 in patients from different geographies [<xref ref-type="bibr" rid="ref7">7</xref>]. Previous studies have also differentiated the 3 variants according to the geographic location (East Asia, Europe, and America) [<xref ref-type="bibr" rid="ref8">8</xref>]. A more recent genome-wide analysis revealed that the frequency of amino acid mutations was higher in the genome sequences of SARS-CoV-2 strains from Europe (43.07%), followed by strains from Asia (38.09%) and North America (29.64%). However, case fatality rates remained higher in the European temperate countries, such as Italy, Spain, Netherlands, France, England, and Belgium [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>The aim of this study was to compare the set of SARS-CoV-2 genomes of viral strains isolated from representative countries in the same meridian (longitude), namely, Italy, Sweden, and Congo, which have different climate conditions, to reveal similarities or differences in the patterns of possible evolutionary pressure signatures in their genomes.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Sequence Data</title>
        <p>We obtained data from the Global Initiative on Sharing All Influenza Data (GISAID) repository and sampled all genomes available therein as of the sampling date (May 5, 2020), including the files congo-gisaid_hcov-19_2020_05_05_09.fasta with 75 entries, italy-gisaid_hcov-19_2020_05_05_10.fasta with 69 entries, sweden-gisaid_hcov-19_2020_05_05_10.fasta with 104 entries, and also the outgroup file brazil_gisaid_hcov-19_2020_05_15_04.fasta with 92 entries. The reference genome with accession number NC_045512.2 was downloaded from the GenBank repository.</p>
      </sec>
      <sec>
        <title>Evolution Model Analysis</title>
        <p>We used the SARS-CoV-2 Wuhan-Hu-1 genome (RefSeq Acc. No. NC_045512.2) as the reference sequence and the VIRULIGN version 1.0.1 application [<xref ref-type="bibr" rid="ref10">10</xref>] to perform multiple sequence alignment, with AliView version 1.26 application for visualizing the results of the analyses [<xref ref-type="bibr" rid="ref11">11</xref>]. HyPhy 2.5.8 (MP) was used to perform recombination analysis by the genetic algorithm recombination detection method and conduct trimming, stop codon removal, and phylogenetic tree and mixed effects model of evolution (MEME) analyses [<xref ref-type="bibr" rid="ref12">12</xref>]. The MEME web site was used to read JSON output files and generate MEME images and tables.</p>
      </sec>
      <sec>
        <title>RNA Secondary Structure Prediction</title>
        <p>We used the RNA_fold web server (part of the Vienna RNA Websuite) to predict secondary structures of both the wild-type and mutated sequences [<xref ref-type="bibr" rid="ref13">13</xref>], and the Forna package [<xref ref-type="bibr" rid="ref14">14</xref>] to build the graph diagrams.</p>
      </sec>
      <sec>
        <title>Protein Analysis</title>
        <p>Protein disorder analysis was conducted using MFDp2 [<xref ref-type="bibr" rid="ref15">15</xref>], NetSurfP-2.0 [<xref ref-type="bibr" rid="ref16">16</xref>], and SPOT-Disorder2 [<xref ref-type="bibr" rid="ref17">17</xref>] applications. Transmembrane analysis of the protein was calculated using the TMHMM server v.2.0, MemBrain webserver [<xref ref-type="bibr" rid="ref18">18</xref>], ProtScale [<xref ref-type="bibr" rid="ref19">19</xref>], and TMpred [<xref ref-type="bibr" rid="ref20">20</xref>] (scores normalized for comparison) on the Expasy website [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      </sec>
      <sec>
        <title>3D Protein Structure Prediction and Ontologies</title>
        <p>Both protein structures were determined with an ab initio approach by using the Robetta webserver [<xref ref-type="bibr" rid="ref22">22</xref>], whereas the DeeProtein capsule from Code Ocean [<xref ref-type="bibr" rid="ref23">23</xref>] was used to predict ontologies of the predicted proteins. 3D images of protein structures and their ontologies were rendered using PyMOL 2.4.0 [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Codon 9628 Evolved Under Episodic Positive Selection</title>
        <p>Mixed evolutionary analysis based on the MEME algorithm was conducted on the SARS-CoV-2 data from Italy, Sweden, and Congo (countries from the same geographic meridian) and Brazil (included as an outgroup). The investigation revealed codon 9628 was under episodic positive selective pressure across the countries, as depicted in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Mixed effects model of evolution (MEME) analysis results showing data obtained from the evolutionary analysis of SARS-CoV-2 from Brazil, Congo, Italy, and Sweden. The top 3 sites for every country are shown, sorted by <italic>P</italic> value.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="100"/>
            <col width="90"/>
            <col width="40"/>
            <col width="40"/>
            <col width="40"/>
            <col width="70"/>
            <col width="60"/>
            <col width="60"/>
            <col width="70"/>
            <col width="110"/>
            <col width="100"/>
            <col width="70"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Country (ID)/Site</td>
                <td>Partition</td>
                <td>α</td>
                <td>β<sup>−</sup></td>
                <td>
                  <italic>p<sup>−</sup></italic>
                </td>
                <td>β<sup>+</sup></td>
                <td>
                  <italic>p<sup>+</sup></italic>
                </td>
                <td>LRT</td>
                <td><italic>P</italic> value</td>
                <td>Branches under selection</td>
                <td>Total branch length</td>
                <td>MEME LogL</td>
                <td>Fixed effects likelihood LogL</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="14">
                  <bold>Brazil (BR)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9628<sup>a</sup></td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.96</td>
                <td>10,000</td>
                <td>0.04</td>
                <td>16.37</td>
                <td>&lt;.001</td>
                <td>2</td>
                <td>0.65</td>
                <td>-27.28</td>
                <td>-20.62</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9928</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.82</td>
                <td>10,000</td>
                <td>0.18</td>
                <td>11.12</td>
                <td>&lt;.001</td>
                <td>4</td>
                <td>2.71</td>
                <td>-31.03</td>
                <td>-28.53</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>81</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.04</td>
                <td>1032.18</td>
                <td>0.96</td>
                <td>6.95</td>
                <td>.01</td>
                <td>5</td>
                <td>1.49</td>
                <td>-40.77</td>
                <td>-40.77</td>
              </tr>
              <tr valign="top">
                <td colspan="14">
                  <bold>Congo (CG)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9628<sup>a</sup></td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.97</td>
                <td>10,000</td>
                <td>0.03</td>
                <td>10.89</td>
                <td>&lt;.001</td>
                <td>1</td>
                <td>0.25</td>
                <td>-18.18</td>
                <td>-13.54</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2884</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.45</td>
                <td>1273.45</td>
                <td>0.55</td>
                <td>3.51</td>
                <td>.08</td>
                <td>5</td>
                <td>0.60</td>
                <td>-42.49</td>
                <td>-42.37</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6541</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.97</td>
                <td>10,000</td>
                <td>0.03</td>
                <td>2.73</td>
                <td>.12</td>
                <td>1</td>
                <td>0.27</td>
                <td>-12.94</td>
                <td>-11.92</td>
              </tr>
              <tr valign="top">
                <td colspan="14">
                  <bold>Italy (IT)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>15</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.96</td>
                <td>10,000</td>
                <td>0.04</td>
                <td>10.21</td>
                <td>&lt;.001</td>
                <td>1</td>
                <td>0.73</td>
                <td>-15.90</td>
                <td>-12.57</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9628<sup>a</sup></td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.97</td>
                <td>10,000</td>
                <td>0.03</td>
                <td>11.24</td>
                <td>&lt;.001</td>
                <td>1</td>
                <td>0.45</td>
                <td>-17.66</td>
                <td>-12.95</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.89</td>
                <td>10,000</td>
                <td>0.11</td>
                <td>7.25</td>
                <td>.01</td>
                <td>0</td>
                <td>1.83</td>
                <td>-13.11</td>
                <td>-10.43</td>
              </tr>
              <tr valign="top">
                <td colspan="14">
                  <bold>Sweden (SE)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9628<sup>a</sup></td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.96</td>
                <td>9613.52</td>
                <td>0.04</td>
                <td>16.03</td>
                <td>&lt;.001</td>
                <td>2</td>
                <td>0.51</td>
                <td>-27.43</td>
                <td>-21.10</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4409</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.97</td>
                <td>4356.70</td>
                <td>0.03</td>
                <td>7.68</td>
                <td>.01</td>
                <td>1</td>
                <td>0.16</td>
                <td>-15.63</td>
                <td>-12.33</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4732</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0.95</td>
                <td>10,000</td>
                <td>0.05</td>
                <td>3.85</td>
                <td>.07</td>
                <td>2</td>
                <td>0.74</td>
                <td>-19.66</td>
                <td>-18.78</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Indicates site 9628.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>In this context, we use the term “site” as a synonym of codon, respecting the HyPhy terminology. The asymptotic <italic>P</italic> value was &lt;.001 for episodic diversification at site 9628. <xref rid="figure1" ref-type="fig">Figure 1</xref> shows the distribution of the <italic>P</italic> value across the sites for all 4 countries.</p>
        <p>A deep check of the multiple alignment data of the 4 countries revealed that the episodic positive selective pressure on site 9628 is a consistent mutation of the codon GGG to ACG, as shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Mixed effects model of evolution site plot. Distribution of the <italic>P</italic> value over the sites in Brazil, Congo, Italy, and Sweden. The purple circle indicates site 9628 that was found to be under episodic selective pressure.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Part of the multiple sequence alignment from the Italian data showing the site 9628 under episodic selective pressure. The nucleotides mutate from GGG to ACG.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>RNA Secondary Structure Prediction Changes</title>
        <p>The prediction of secondary structure before and after mutation shows important differences, as shown by the mutation from GGG to ACG (<xref rid="figure3" ref-type="fig">Figure 3</xref>). The comparison between the 2 predicted secondary structures highlighted structural modifications at the top-right ring of the RNA conformation, as depicted in <xref rid="figure4" ref-type="fig">Figure 4</xref>, suggesting the GGG to ACG mutation was responsible for a significant modification of the RNA secondary structure.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Nucleotide mutation over aligned sequences, illustrating the sequence considered to predict secondary structures in both mutated and wild-type proteins. Site position is indicated in blue, from the start codon (9578) to the open reading frame (9632).</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Secondary structure prediction. The 2 RNA diagrams exhibit structural modifications affected by the GGG to ACG mutation.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Protein Analysis</title>
        <p>The analysis of the protein conducted to find its disordered region showed the positions from 41 to 59 to be more stable, with the glycine (G) placed at the 50th position. We obtained results by using 3 different software tools and considering the average value for the probability of disorder, as shown in <xref rid="figure5" ref-type="fig">Figure 5</xref> and reported in <xref ref-type="table" rid="table2">Table 2</xref>. Further analysis to locate the transmembrane region in the protein revealed that locations 54-67 were associated with this function. The analysis, conducted by using 4 distinct web applications and by evaluating the resultant average values, places the glycine (G) near enough to the transmembrane region to suggest its involvement. <xref ref-type="table" rid="table3">Table 3</xref> reports the data showing the probabilities of each amino acid acting as the transmembrane. The transmembrane topology of the sequence (<xref rid="figure6" ref-type="fig">Figure 6</xref>) highlights the amino acid G at location 50 in the middle of the transmembrane region, and the distribution of the probabilities (<xref rid="figure7" ref-type="fig">Figure 7</xref>) corroborates this hypothesis.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Disorder region analysis. The region 41-59 was found to have the lowest probability to be disordered. The orange lines delimit this region, and the blue dotted line outlines the position of G on the different curves.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Protein disorder analysis results showing the probability of disorder for each position of the protein. The probabilities have been calculated using MFDp2, NetsurfP2, and SPOTD software.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="180"/>
            <col width="180"/>
            <col width="180"/>
            <col width="180"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Position</td>
                <td>Amino acid sequence</td>
                <td colspan="4">Disorder probability values</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>MFDp2</td>
                <td>NetsurfP2</td>
                <td>SPOTD</td>
                <td>Average value<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>M</td>
                <td>0.132</td>
                <td>0.627823114</td>
                <td>0.5607</td>
                <td>0.440174371</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>L</td>
                <td>0.134</td>
                <td>0.347978383</td>
                <td>0.5358</td>
                <td>0.339259461</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Q</td>
                <td>0.135</td>
                <td>0.270706475</td>
                <td>0.4945</td>
                <td>0.300068825</td>
              </tr>
              <tr valign="top">
                <td>…</td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>39</td>
                <td>T</td>
                <td>0.03</td>
                <td>0.010842944</td>
                <td>0.1936</td>
                <td>0.078147648</td>
              </tr>
              <tr valign="top">
                <td>40</td>
                <td>V</td>
                <td>0.029</td>
                <td>0.007660664</td>
                <td>0.189</td>
                <td>0.075220221</td>
              </tr>
              <tr valign="top">
                <td>41</td>
                <td>Q</td>
                <td>0.027</td>
                <td>0.004478907</td>
                <td>0.172</td>
                <td>0.067826302</td>
              </tr>
              <tr valign="top">
                <td>42</td>
                <td>E</td>
                <td>0.025</td>
                <td>0.00340931</td>
                <td>0.1848</td>
                <td>0.07106977</td>
              </tr>
              <tr valign="top">
                <td>43</td>
                <td>I</td>
                <td>0.025</td>
                <td>0.003887762</td>
                <td>0.1968</td>
                <td>0.075229254</td>
              </tr>
              <tr valign="top">
                <td>44</td>
                <td>Q</td>
                <td>0.024</td>
                <td>0.003997837</td>
                <td>0.1927</td>
                <td>0.073565946</td>
              </tr>
              <tr valign="top">
                <td>45</td>
                <td>L</td>
                <td>0.023</td>
                <td>0.00361518</td>
                <td>0.2129</td>
                <td>0.079838393</td>
              </tr>
              <tr valign="top">
                <td>46</td>
                <td>Q</td>
                <td>0.023</td>
                <td>0.004551574</td>
                <td>0.2123</td>
                <td>0.079950525</td>
              </tr>
              <tr valign="top">
                <td>47</td>
                <td>A</td>
                <td>0.023</td>
                <td>0.004939525</td>
                <td>0.2011</td>
                <td>0.076346508</td>
              </tr>
              <tr valign="top">
                <td>48</td>
                <td>A</td>
                <td>0.022</td>
                <td>0.005752307</td>
                <td>0.2133</td>
                <td>0.080350769</td>
              </tr>
              <tr valign="top">
                <td>49</td>
                <td>V</td>
                <td>0.022</td>
                <td>0.002826149</td>
                <td>0.2524</td>
                <td>0.092408716</td>
              </tr>
              <tr valign="top">
                <td>50<sup>b</sup></td>
                <td>G</td>
                <td>0.022</td>
                <td>0.005828088</td>
                <td>0.2013</td>
                <td>0.076376029</td>
              </tr>
              <tr valign="top">
                <td>51</td>
                <td>E</td>
                <td>0.022</td>
                <td>0.001046103</td>
                <td>0.24</td>
                <td>0.087682034</td>
              </tr>
              <tr valign="top">
                <td>52</td>
                <td>L</td>
                <td>0.023</td>
                <td>0.000922468</td>
                <td>0.2694</td>
                <td>0.097774156</td>
              </tr>
              <tr valign="top">
                <td>53</td>
                <td>L</td>
                <td>0.023</td>
                <td>0.001263275</td>
                <td>0.2588</td>
                <td>0.094354425</td>
              </tr>
              <tr valign="top">
                <td>54</td>
                <td>L</td>
                <td>0.023</td>
                <td>0.001187441</td>
                <td>0.2539</td>
                <td>0.092695814</td>
              </tr>
              <tr valign="top">
                <td>55</td>
                <td>L</td>
                <td>0.023</td>
                <td>0.000650476</td>
                <td>0.2483</td>
                <td>0.090650159</td>
              </tr>
              <tr valign="top">
                <td>56</td>
                <td>E</td>
                <td>0.023</td>
                <td>0.000615434</td>
                <td>0.2328</td>
                <td>0.085471811</td>
              </tr>
              <tr valign="top">
                <td>57</td>
                <td>W</td>
                <td>0.023</td>
                <td>0.001080571</td>
                <td>0.2302</td>
                <td>0.08476019</td>
              </tr>
              <tr valign="top">
                <td>58</td>
                <td>L</td>
                <td>0.023</td>
                <td>0.000941573</td>
                <td>0.2154</td>
                <td>0.079780524</td>
              </tr>
              <tr valign="top">
                <td>59</td>
                <td>A</td>
                <td>0.023</td>
                <td>0.001573079</td>
                <td>0.208</td>
                <td>0.07752436</td>
              </tr>
              <tr valign="top">
                <td>60</td>
                <td>M</td>
                <td>0.024</td>
                <td>0.000997698</td>
                <td>0.2853</td>
                <td>0.103432566</td>
              </tr>
              <tr valign="top">
                <td>61</td>
                <td>A</td>
                <td>0.024</td>
                <td>0.00227783</td>
                <td>0.3026</td>
                <td>0.109625943</td>
              </tr>
              <tr valign="top">
                <td>62</td>
                <td>V</td>
                <td>0.025</td>
                <td>0.003362786</td>
                <td>0.3503</td>
                <td>0.126220929</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Average values of the disorder probability for each position.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Amino acid G placed at position 50, inside the stable region.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Transmembrane prediction results obtained using TMHMM, MemBrainTHM, ProtScale, and TMpred applications. Results from ProtScale and TMpred have been normalized for comparison with other probabilities.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="90"/>
            <col width="130"/>
            <col width="160"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Position</td>
                <td>Amino acid sequence</td>
                <td>TMHMM probability</td>
                <td>MemBrain THM propensity</td>
                <td>ProtScale normalized score</td>
                <td>TMpred normalized score</td>
                <td>Transmembrane probability, average value<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>M</td>
                <td>0</td>
                <td>0.000191</td>
                <td>N/A<sup>b</sup></td>
                <td>0.661425764</td>
                <td>0.220538921</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>L</td>
                <td>0</td>
                <td>0.002851</td>
                <td>N/A<sup>b</sup></td>
                <td>0.661425764</td>
                <td>0.221425588</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Q</td>
                <td>0</td>
                <td>0.046538</td>
                <td>N/A<sup>b</sup></td>
                <td>0.661425764</td>
                <td>0.235987921</td>
              </tr>
              <tr valign="top">
                <td>…</td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>49</td>
                <td>V</td>
                <td>0.2594</td>
                <td>0.987914</td>
                <td>0.646</td>
                <td>0.603358942</td>
                <td>0.624168236</td>
              </tr>
              <tr valign="top">
                <td>50<sup>c</sup></td>
                <td>G</td>
                <td>0.27719</td>
                <td>0.987914</td>
                <td>0.646</td>
                <td>0.629801679</td>
                <td>0.63522642</td>
              </tr>
              <tr valign="top">
                <td>51</td>
                <td>E</td>
                <td>0.28083</td>
                <td>0.991702</td>
                <td>0.736</td>
                <td>0.660532428</td>
                <td>0.667266107</td>
              </tr>
              <tr valign="top">
                <td>52</td>
                <td>L</td>
                <td>0.32735</td>
                <td>0.993857</td>
                <td>0.67</td>
                <td>0.594246918</td>
                <td>0.646363479</td>
              </tr>
              <tr valign="top">
                <td>53</td>
                <td>L</td>
                <td>0.56651</td>
                <td>0.993857</td>
                <td>0.637</td>
                <td>0.778452743</td>
                <td>0.743954936</td>
              </tr>
              <tr valign="top">
                <td>54</td>
                <td>L</td>
                <td>0.63937</td>
                <td>0.994522</td>
                <td>0.632</td>
                <td>0.73360729</td>
                <td>0.749874822</td>
              </tr>
              <tr valign="top">
                <td>55</td>
                <td>L</td>
                <td>0.64032</td>
                <td>0.990459</td>
                <td>0.659</td>
                <td>0.818831517</td>
                <td>0.777152629</td>
              </tr>
              <tr valign="top">
                <td>56</td>
                <td>E</td>
                <td>0.64052</td>
                <td>0.96027</td>
                <td>0.726</td>
                <td>0.835626228</td>
                <td>0.790604057</td>
              </tr>
              <tr valign="top">
                <td>57</td>
                <td>W</td>
                <td>0.64826</td>
                <td>0.946819</td>
                <td>0.701</td>
                <td>0.822583527</td>
                <td>0.779665632</td>
              </tr>
              <tr valign="top">
                <td>58</td>
                <td>L</td>
                <td>0.6493</td>
                <td>0.947424</td>
                <td>0.706</td>
                <td>0.895122387</td>
                <td>0.799461597</td>
              </tr>
              <tr valign="top">
                <td>59</td>
                <td>A</td>
                <td>0.64928</td>
                <td>0.947424</td>
                <td>0.683</td>
                <td>0.905663748</td>
                <td>0.796341937</td>
              </tr>
              <tr valign="top">
                <td>60</td>
                <td>M</td>
                <td>0.64927</td>
                <td>0.970735</td>
                <td>0.683</td>
                <td>0.947293193</td>
                <td>0.812574548</td>
              </tr>
              <tr valign="top">
                <td>61</td>
                <td>A</td>
                <td>0.64924</td>
                <td>0.970735</td>
                <td>0.773</td>
                <td>0.955511881</td>
                <td>0.83712172</td>
              </tr>
              <tr valign="top">
                <td>62</td>
                <td>V</td>
                <td>0.64903</td>
                <td>0.937507</td>
                <td>0.831</td>
                <td>1</td>
                <td>0.85438425</td>
              </tr>
              <tr valign="top">
                <td>63</td>
                <td>M</td>
                <td>0.64893</td>
                <td>0.892506</td>
                <td>0.831</td>
                <td>0.960871896</td>
                <td>0.833326974</td>
              </tr>
              <tr valign="top">
                <td>64</td>
                <td>L</td>
                <td>0.6482</td>
                <td>0.846403</td>
                <td>0.84</td>
                <td>0.942826514</td>
                <td>0.819357379</td>
              </tr>
              <tr valign="top">
                <td>65</td>
                <td>L</td>
                <td>0.64758</td>
                <td>0.781733</td>
                <td>0.847</td>
                <td>0.924066464</td>
                <td>0.800094866</td>
              </tr>
              <tr valign="top">
                <td>66</td>
                <td>L</td>
                <td>0.63557</td>
                <td>0.670387</td>
                <td>0.856</td>
                <td>0.661425764</td>
                <td>0.705845691</td>
              </tr>
              <tr valign="top">
                <td>67</td>
                <td>L</td>
                <td>0.61835</td>
                <td>0.539353</td>
                <td>0.851</td>
                <td>0.661425764</td>
                <td>0.667532191</td>
              </tr>
              <tr valign="top">
                <td>68</td>
                <td>C</td>
                <td>0.5428</td>
                <td>0.455615</td>
                <td>0.819</td>
                <td>0.661425764</td>
                <td>0.619710191</td>
              </tr>
              <tr valign="top">
                <td>69</td>
                <td>C</td>
                <td>0.51009</td>
                <td>0.430385</td>
                <td>0.728</td>
                <td>0.661425764</td>
                <td>0.582475191</td>
              </tr>
              <tr valign="top">
                <td>70</td>
                <td>C</td>
                <td>0.44702</td>
                <td>0.380525</td>
                <td>N/A<sup>b</sup></td>
                <td>0.661425764</td>
                <td>0.496323588</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Average values of the probability for each position.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>The window size used for the profile computation is 9, so the score is not applicable for positions 1-4 and 70-73.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Amino acid G placed at position 50, inside the stable region.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Topology diagram using the MemBrain v3. The illustration depicts the transmembrane topology of the sequence and highlights that the amino acid at position 50 (G) is positioned into the middle of the transmembrane region. Red: transmembrane helix (TMH); blue: loop.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Transmembrane prediction. The region 54-67 was found to be the region with the highest probability to code for the transmembrane, and the G amino acid is near enough to suppose its involvement. The orange lines delimit this region, and the blue dotted line outlines the position of G on the different curves.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>3D Protein Analysis</title>
        <p>To characterize the deduced protein P0DTD3.1, we predicted the 3D structures for both the wild-type and mutated protein sequences using an ab initio approach. According to the preliminary clue from the secondary structure prediction, the mutated protein presents a slightly different structure when the amino acid residue changed from G to T. <xref rid="figure8" ref-type="fig">Figures 8</xref> and <xref rid="figure9" ref-type="fig">9</xref> illustrate both the predicted models showing that the mutation would affect the tertiary structure of the protein. The comparison of residues 45-55 between MUT31136 and MOD30336 showed that this portion of the protein with the mutation stretches out with repercussions to the preceding helix. This result suggests that the mutation of the single amino acid from G to T, with consecutive stretching cycles on the 3D structure of the protein, tends to make the protein assume new functions.</p>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Prediction of the 3D structure for the mutated protein of SARS-CoV-2. The model MUT31136 represents the predicted 3D model of the protein subject to mutation. (A) Amino acid sequence colored by the spectrum range, with the mutated amino acid indicated in black color at position 50 (T). (B) The protein has been oriented to facilitate the comparison and residue 50 is represented with red dots. (C) Details of the residues 45-55 and their rotation (D) around the Y-axis and (E) around the X-axis with a step of 90°.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Prediction of the 3D structure of the unchanged protein. The model MOD30506 represents the predicted 3D model of the wild-type protein. (A) Amino acid sequence colored by the spectrum range, with the investigated amino acid indicated in black color at position 50 (G). (B) The protein has been oriented to facilitate the comparison and the residue 50 is represented with the red dots. (C) Details of the residues 45-55 and their rotation (D) around the Y-axis and (E) around the X-axis with a step of 90°.</p>
          </caption>
          <graphic xlink:href="bioinform_v2i1e25995_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Prediction of Protein-Related Ontologies</title>
        <p>The analysis of protein ontologies indicates different functions between the wild-type and mutated proteins, owing to their changed structures. As shown in <xref ref-type="table" rid="table4">Table 4</xref>, the wild-type variant of the protein is linked with a high probability (.978≤<italic>P</italic>≤1) to both catalytic and transferase activities. The mutated variant of the protein presents a remarkable change in its functionality trend: even if usually the scores below 0.5 are interpreted as negative predictions, in an evolutionary context, the decrease in probability of the transferase activity (from 0.98 to 0.375) to favor the binding function (from 0.004 to 0.132) is not regarded as negligible. The contextual inversion of tendency of transferase to binding activity suggests that the episodic evolutionary mutation aims to improve the binding ability of the protein.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Classification report showing the predicted functions of both (mutated and wild-type) protein sequences and related scores. Only positive scores are reported.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Gene ontology terms and function</td>
                <td colspan="2">Score</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Wild-type protein sequence</td>
                <td>Mutated protein sequence</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>GO:0003674</td>
                <td>Molecular function</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>GO:0003824</td>
                <td>Catalytic function</td>
                <td>1</td>
                <td>0.998</td>
              </tr>
              <tr valign="top">
                <td>GO:0016740<sup>a</sup></td>
                <td>Transferase activity</td>
                <td>0.978</td>
                <td>0.375</td>
              </tr>
              <tr valign="top">
                <td>GO:0016829</td>
                <td>Lyase activity</td>
                <td>0.017</td>
                <td>—<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>GO:0022891</td>
                <td>Transmembrane</td>
                <td>0.07</td>
                <td>—<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>GO:0005488<sup>a</sup></td>
                <td>Binding activity</td>
                <td>0.004</td>
                <td>0.132</td>
              </tr>
              <tr valign="top">
                <td>GO:0022892</td>
                <td>Transmembrane transport activity</td>
                <td>0.001</td>
                <td>0.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Ontological functions subjected to inverted tendency.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>Unpredicted function.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>SARS-CoV-2, the virus known to cause the COVID-19 pandemic, has many peculiar characteristics, such as rapidly accumulating mutations, compared to other coronaviruses [<xref ref-type="bibr" rid="ref25">25</xref>]. Specifically, the prevalence of single nucleotide transitions as the major mutational type of SARS-CoV-2 across the world has been shown previously [<xref ref-type="bibr" rid="ref7">7</xref>]. In this study, we conducted evolutionary analyses on the mutations to determine whether SARS-CoV-2 genomes from different countries in the same meridian might have specific variation patterns. We found that codon 9628 was under episodic selective pressure for all 4 countries in the same meridian. This would affect RNA secondary structure and, consequently, the protein product, with T (threonine) changing to G (glycine) in protein position 50. This position is located close to the predicted transmembrane region. Mutation analysis revealed that a change from G (glycine) to D (aspartic acid) may confer a new function to the protein, that is, binding activity, which in turn may be responsible for attaching the virus to human eukaryotic cells. These bioinformatics findings may help in better designing in vitro (wet lab) and in vivo (animal model) experiments to determine protein variants associated with the virulence of the virus. Therefore, these findings may eventually facilitate vaccine design and successful antiviral strategies. For example, the results of this study suggest the need for site-directed mutagenesis and animal experiments to validate the anticipated effects.</p>
        <p>Mercatelli and Georgi [<xref ref-type="bibr" rid="ref7">7</xref>] demonstrated that clade G, prevalent in Europe, carries a D614G mutation in the spike protein, which is responsible for the initial interaction of the virus with the host human cell. Other studies have also shown different mutation locations among strains isolated from different continents. Mutations at positions 2891, 3036, 14408, 23403, and 28881 are predominantly observed in European strains, whereas those located at positions 17746, 17857, and 18060 are exclusively present in North American strains of SARS-CoV-2 [<xref ref-type="bibr" rid="ref26">26</xref>]. Their findings suggest that the virus is evolving and that European, North American, and Asian strains of the virus might coexist, with each characterized by different mutation patterns.</p>
        <p>Furthermore, a comparison of viral genomes of SARS-CoV-2 strains from 13 countries identified differences in the protein-coding sequences. For example, an Indian strain showed a mutation in the spike glycoprotein at R408I and in the replicase polyprotein at I671T, P2144S, and A2798V, whereas the spike protein of Spanish and South Korean strains carried an F797C and a S221W mutation, respectively [<xref ref-type="bibr" rid="ref27">27</xref>]. Moreover, recently conducted integrative analyses of SARS-CoV-2 genomes of strains from different geographical locations reveal unique features that are potentially consequential to host-virus interaction and pathogenesis [<xref ref-type="bibr" rid="ref28">28</xref>]. However, the most recent study of genomic diversity and hotspot mutations in 30,983 SARS-CoV-2 genomes indicates that unlike the influenza virus or HIV, SARS-CoV-2 has a low mutation rate, which makes the development of an effective global vaccine very likely [<xref ref-type="bibr" rid="ref29">29</xref>]. The study determined several hotspot mutations across the whole SARS-CoV-2 genome. In all, 14 nonsynonymous hotspot mutations (whose prevalence of mutations is &gt;10%) have been identified at different locations along the viral genome: 8 in ORF1ab polyprotein (in nsp2, nsp3, transmembrane domain, RdRp, helicase, exonuclease, and endoribonuclease), 3 in nucleocapsid protein, and 1 in each of the 3 proteins spike, ORF3a, and ORF8. Moreover, 36 nonsynonymous mutations were identified in the receptor-binding domain of the spike protein with a low prevalence (&lt;1%) across all genomes [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>All these findings highlight the importance of studying the relationship of geographical locations of SARS-CoV-2 isolates and mutations in their genomes, because the relationship can also be confirmed by phylogenetic tree analyses for elucidation of lineages and clusters based on the geographic locations. In conclusion, this genome evolutionary analysis revealed that codon 9628 is under episodic selective pressure for SARS-CoV-2 strains isolated from all 4 countries (Italy, Sweden, Congo, and Brazil) of the same geographical meridian.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">GISAID</term>
          <def>
            <p>Global Initiative on Sharing All Influenza Data</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">MEME</term>
          <def>
            <p>mixed effects model of evolution</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MERS-CoV</term>
          <def>
            <p>Middle East respiratory syndrome coronavirus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ORF</term>
          <def>
            <p>open reading frame</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by grants from the National Natural Science Foundation of China (NSFC81671980, 81871623, 82020108022, Shu-Lin Liu). The funding bodies played no role in the design of the study; collection, analysis, or interpretation of data; or in writing the manuscript.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bar-Zeev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Inglesby</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccines: early success and remaining challenges</article-title>
          <source>The Lancet</source>
          <year>2020</year>
          <month>09</month>
          <volume>396</volume>
          <issue>10255</issue>
          <fpage>868</fpage>
          <lpage>869</lpage>
          <pub-id pub-id-type="doi">10.1016/s0140-6736(20)31867-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Logunov</surname>
              <given-names>DY</given-names>
            </name>
            <name name-style="western">
              <surname>Dolzhikova</surname>
              <given-names>IV</given-names>
            </name>
            <name name-style="western">
              <surname>Zubkova</surname>
              <given-names>OV</given-names>
            </name>
            <name name-style="western">
              <surname>Tukhvatulin</surname>
              <given-names>AI</given-names>
            </name>
            <name name-style="western">
              <surname>Shcheblyakov</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Dzharullaeva</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Grousova</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Erokhova</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Kovyrshina</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Botikov</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Izhaeva</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Popova</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Ozharovskaya</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Esmagambetov</surname>
              <given-names>IB</given-names>
            </name>
            <name name-style="western">
              <surname>Favorskaya</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Zrelkin</surname>
              <given-names>DI</given-names>
            </name>
            <name name-style="western">
              <surname>Voronina</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Shcherbinin</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Semikhin</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Simakova</surname>
              <given-names>YV</given-names>
            </name>
            <name name-style="western">
              <surname>Tokarskaya</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Lubenets</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Egorova</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Shmarov</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Nikitenko</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Morozova</surname>
              <given-names>LF</given-names>
            </name>
            <name name-style="western">
              <surname>Smolyarchuk</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Kryukov</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Babira</surname>
              <given-names>VF</given-names>
            </name>
            <name name-style="western">
              <surname>Borisevich</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Naroditsky</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Gintsburg</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>Safety and immunogenicity of an rAd26 and rAd5 vector-based heterologous prime-boost COVID-19 vaccine in two formulations: two open, non-randomised phase 1/2 studies from Russia</article-title>
          <source>The Lancet</source>
          <year>2020</year>
          <month>09</month>
          <volume>396</volume>
          <issue>10255</issue>
          <fpage>887</fpage>
          <lpage>897</lpage>
          <pub-id pub-id-type="doi">10.1016/s0140-6736(20)31866-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naqvi</surname>
              <given-names>AAT</given-names>
            </name>
            <name name-style="western">
              <surname>Fatima</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mohammad</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fatima</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>IK</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Atif</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Hariprasad</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Insights into SARS-CoV-2 genome, structure, evolution, pathogenesis and therapies: Structural genomics approach</article-title>
          <source>Biochim Biophys Acta Mol Basis Dis</source>
          <year>2020</year>
          <month>10</month>
          <day>01</day>
          <volume>1866</volume>
          <issue>10</issue>
          <fpage>165878</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32544429"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.bbadis.2020.165878</pub-id>
          <pub-id pub-id-type="medline">32544429</pub-id>
          <pub-id pub-id-type="pii">S0925-4439(20)30226-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7293463</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dilucca</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Forcelloni</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Georgakilas</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Giansanti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pavlopoulou</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Codon usage and phenotypic divergences of SARS-CoV-2 genes</article-title>
          <source>Viruses</source>
          <year>2020</year>
          <month>04</month>
          <day>30</day>
          <volume>12</volume>
          <issue>5</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=v12050498"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/v12050498</pub-id>
          <pub-id pub-id-type="medline">32366025</pub-id>
          <pub-id pub-id-type="pii">v12050498</pub-id>
          <pub-id pub-id-type="pmcid">PMC7290700</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khailany</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Safdar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ozaslan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Genomic characterization of a novel SARS-CoV-2</article-title>
          <source>Gene Rep</source>
          <year>2020</year>
          <month>06</month>
          <volume>19</volume>
          <fpage>100682</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32300673"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.genrep.2020.100682</pub-id>
          <pub-id pub-id-type="medline">32300673</pub-id>
          <pub-id pub-id-type="pii">S2452-0144(20)30096-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7161481</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gussow</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Auslander</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Faure</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>YI</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Koonin</surname>
              <given-names>EV</given-names>
            </name>
          </person-group>
          <article-title>Genomic determinants of pathogenicity in SARS-CoV-2 and other human coronaviruses</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2020</year>
          <month>06</month>
          <day>30</day>
          <volume>117</volume>
          <issue>26</issue>
          <fpage>15193</fpage>
          <lpage>15199</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&amp;pmid=32522874"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.2008176117</pub-id>
          <pub-id pub-id-type="medline">32522874</pub-id>
          <pub-id pub-id-type="pii">2008176117</pub-id>
          <pub-id pub-id-type="pmcid">PMC7334499</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mercatelli</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Giorgi</surname>
              <given-names>FM</given-names>
            </name>
          </person-group>
          <article-title>Geographic and genomic distribution of SARS-CoV-2 mutations</article-title>
          <source>Front Microbiol</source>
          <year>2020</year>
          <volume>11</volume>
          <fpage>1800</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fmicb.2020.01800"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fmicb.2020.01800</pub-id>
          <pub-id pub-id-type="medline">32793182</pub-id>
          <pub-id pub-id-type="pmcid">PMC7387429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Forster</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Forster</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Renfrew</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Forster</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Phylogenetic network analysis of SARS-CoV-2 genomes</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2020</year>
          <month>04</month>
          <day>28</day>
          <volume>117</volume>
          <issue>17</issue>
          <fpage>9241</fpage>
          <lpage>9243</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&amp;pmid=32269081"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.2004999117</pub-id>
          <pub-id pub-id-type="medline">32269081</pub-id>
          <pub-id pub-id-type="pii">2004999117</pub-id>
          <pub-id pub-id-type="pmcid">PMC7196762</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Alam</surname>
              <given-names>ASMRU</given-names>
            </name>
            <name name-style="western">
              <surname>Akther</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Puspo</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Akter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sultana</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Crandall</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Genome-wide analysis of SARS-CoV-2 virus strains circulating worldwide implicates heterogeneity</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>08</month>
          <day>19</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>14004</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-70812-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-70812-6</pub-id>
          <pub-id pub-id-type="medline">32814791</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-70812-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7438523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Libin</surname>
              <given-names>PJK</given-names>
            </name>
            <name name-style="western">
              <surname>Deforche</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Abecasis</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Theys</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>VIRULIGN: fast codon-correct alignment and annotation of viral genomes</article-title>
          <source>Bioinformatics</source>
          <year>2019</year>
          <month>05</month>
          <day>15</day>
          <volume>35</volume>
          <issue>10</issue>
          <fpage>1763</fpage>
          <lpage>1765</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30295730"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/bty851</pub-id>
          <pub-id pub-id-type="medline">30295730</pub-id>
          <pub-id pub-id-type="pii">5123354</pub-id>
          <pub-id pub-id-type="pmcid">PMC6513156</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Larsson</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>AliView: a fast and lightweight alignment viewer and editor for large datasets</article-title>
          <source>Bioinformatics</source>
          <year>2014</year>
          <month>11</month>
          <day>15</day>
          <volume>30</volume>
          <issue>22</issue>
          <fpage>3276</fpage>
          <lpage>3278</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25095880"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btu531</pub-id>
          <pub-id pub-id-type="medline">25095880</pub-id>
          <pub-id pub-id-type="pii">btu531</pub-id>
          <pub-id pub-id-type="pmcid">PMC4221126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murrell</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wertheim</surname>
              <given-names>JO</given-names>
            </name>
            <name name-style="western">
              <surname>Moola</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weighill</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Scheffler</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kosakovsky Pond</surname>
              <given-names>SL</given-names>
            </name>
          </person-group>
          <article-title>Detecting individual sites subject to episodic diversifying selection</article-title>
          <source>PLoS Genet</source>
          <year>2012</year>
          <volume>8</volume>
          <issue>7</issue>
          <fpage>e1002764</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pgen.1002764"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pgen.1002764</pub-id>
          <pub-id pub-id-type="medline">22807683</pub-id>
          <pub-id pub-id-type="pii">PGENETICS-D-12-00164</pub-id>
          <pub-id pub-id-type="pmcid">PMC3395634</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lorenz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bernhart</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Höner Zu Siederdissen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tafer</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Flamm</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Stadler</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>Hofacker</surname>
              <given-names>IL</given-names>
            </name>
          </person-group>
          <article-title>ViennaRNA Package 2.0</article-title>
          <source>Algorithms Mol Biol</source>
          <year>2011</year>
          <month>11</month>
          <day>24</day>
          <volume>6</volume>
          <fpage>26</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://almob.biomedcentral.com/articles/10.1186/1748-7188-6-26"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1748-7188-6-26</pub-id>
          <pub-id pub-id-type="medline">22115189</pub-id>
          <pub-id pub-id-type="pii">1748-7188-6-26</pub-id>
          <pub-id pub-id-type="pmcid">PMC3319429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kerpedjiev</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hammer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hofacker</surname>
              <given-names>IL</given-names>
            </name>
          </person-group>
          <article-title>Forna (force-directed RNA): Simple and effective online RNA secondary structure diagrams</article-title>
          <source>Bioinformatics</source>
          <year>2015</year>
          <month>10</month>
          <day>15</day>
          <volume>31</volume>
          <issue>20</issue>
          <fpage>3377</fpage>
          <lpage>3379</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26099263"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btv372</pub-id>
          <pub-id pub-id-type="medline">26099263</pub-id>
          <pub-id pub-id-type="pii">btv372</pub-id>
          <pub-id pub-id-type="pmcid">PMC4595900</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mizianty</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Uversky</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Kurgan</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Prediction of intrinsic disorder in proteins using MFDp2</article-title>
          <source>Methods Mol Biol</source>
          <year>2014</year>
          <volume>1137</volume>
          <fpage>147</fpage>
          <lpage>162</lpage>
          <pub-id pub-id-type="doi">10.1007/978-1-4939-0366-5_11</pub-id>
          <pub-id pub-id-type="medline">24573480</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klausen</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Jespersen</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Jurtz</surname>
              <given-names>VI</given-names>
            </name>
            <name name-style="western">
              <surname>Sønderby</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Sommer</surname>
              <given-names>MOA</given-names>
            </name>
            <name name-style="western">
              <surname>Winther</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Petersen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Marcatili</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>NetSurfP-2.0: Improved prediction of protein structural features by integrated deep learning</article-title>
          <source>Proteins</source>
          <year>2019</year>
          <month>06</month>
          <day>09</day>
          <volume>87</volume>
          <issue>6</issue>
          <fpage>520</fpage>
          <lpage>527</lpage>
          <pub-id pub-id-type="doi">10.1002/prot.25674</pub-id>
          <pub-id pub-id-type="medline">30785653</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hanson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Paliwal</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Litfin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>SPOT-Disorder2: improved protein intrinsic disorder prediction by ensembled deep learning</article-title>
          <source>Genomics Proteomics Bioinformatics</source>
          <year>2019</year>
          <month>12</month>
          <volume>17</volume>
          <issue>6</issue>
          <fpage>645</fpage>
          <lpage>656</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1672-0229(20)30024-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.gpb.2019.01.004</pub-id>
          <pub-id pub-id-type="medline">32173600</pub-id>
          <pub-id pub-id-type="pii">S1672-0229(20)30024-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7212484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>MemBrain: an easy-to-use online webserver for transmembrane protein structure prediction</article-title>
          <source>Nanomicro Lett</source>
          <year>2018</year>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>2</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30393651"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40820-017-0156-2</pub-id>
          <pub-id pub-id-type="medline">30393651</pub-id>
          <pub-id pub-id-type="pii">156</pub-id>
          <pub-id pub-id-type="pmcid">PMC6199043</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilkins</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Gasteiger</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bairoch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez</surname>
              <given-names>J-C</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Appel</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Hochstrasser</surname>
              <given-names>DF</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Link</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Protein identification and analysis tools in the ExPASy server</article-title>
          <source>2-D Proteome Analysis Protocols. Methods in Molecular Biology vol. 112</source>
          <year>1999</year>
          <publisher-loc>Totowa, NJ</publisher-loc>
          <publisher-name>Humana Press</publisher-name>
          <fpage>531</fpage>
          <lpage>52</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Stoffel</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>TMbase - a database of membrane spanning proteins segments</article-title>
          <source>Biol. Chem. Hoppe-Seyler</source>
          <year>1993</year>
          <volume>374</volume>
          <fpage>166</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://embnet.vital-it.ch/software/tmbase/TMBASE_doc.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gasteiger</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gattiker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoogland</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ivanyi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Appel</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Bairoch</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>ExPASy: The proteomics server for in-depth protein knowledge and analysis</article-title>
          <source>Nucleic Acids Res</source>
          <year>2003</year>
          <month>07</month>
          <day>01</day>
          <volume>31</volume>
          <issue>13</issue>
          <fpage>3784</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12824418"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkg563</pub-id>
          <pub-id pub-id-type="medline">12824418</pub-id>
          <pub-id pub-id-type="pmcid">PMC168970</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Chivian</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Protein structure prediction and analysis using the Robetta server</article-title>
          <source>Nucleic Acids Res</source>
          <year>2004</year>
          <month>07</month>
          <day>01</day>
          <volume>32</volume>
          <issue>Web Server issue</issue>
          <fpage>W526</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/15215442"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkh468</pub-id>
          <pub-id pub-id-type="medline">15215442</pub-id>
          <pub-id pub-id-type="pii">32/suppl_2/W526</pub-id>
          <pub-id pub-id-type="pmcid">PMC441606</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Upmeier zu Belzen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bürgel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Holderbach</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bubeck</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Adam</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gandor</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mathony</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pfuderer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Platz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Przybilla</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schwendemann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Heid</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Jendrusch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schmelas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Waldhauer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lehmann</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Niopek</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Eils</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Leveraging implicit knowledge in neural networks for functional dissection and engineering of proteins</article-title>
          <source>Nat Mach Intell</source>
          <year>2019</year>
          <month>05</month>
          <day>13</day>
          <volume>1</volume>
          <issue>5</issue>
          <fpage>225</fpage>
          <lpage>235</lpage>
          <pub-id pub-id-type="doi">10.1038/s42256-019-0049-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rigsby</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Parker</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>Using the PyMOL application to reinforce visual understanding of protein structure</article-title>
          <source>Biochem Mol Biol Educ</source>
          <year>2016</year>
          <month>09</month>
          <day>10</day>
          <volume>44</volume>
          <issue>5</issue>
          <fpage>433</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/bmb.20966"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/bmb.20966</pub-id>
          <pub-id pub-id-type="medline">27241834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y-P</given-names>
            </name>
            <name name-style="western">
              <surname>Boerwinkle</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>Y-X</given-names>
            </name>
          </person-group>
          <article-title>Moderate mutation rate in the SARS coronavirus genome and its implications</article-title>
          <source>BMC Evol Biol</source>
          <year>2004</year>
          <month>06</month>
          <day>28</day>
          <volume>4</volume>
          <fpage>21</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcevolbiol.biomedcentral.com/articles/10.1186/1471-2148-4-21"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2148-4-21</pub-id>
          <pub-id pub-id-type="medline">15222897</pub-id>
          <pub-id pub-id-type="pii">1471-2148-4-21</pub-id>
          <pub-id pub-id-type="pmcid">PMC446188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pachetti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marini</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Benedetti</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Giudici</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mauro</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Storici</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Masciovecchio</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Angeletti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ciccozzi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gallo</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Zella</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ippodrino</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Emerging SARS-CoV-2 mutation hot spots include a novel RNA-dependent-RNA polymerase variant</article-title>
          <source>J Transl Med</source>
          <year>2020</year>
          <month>04</month>
          <day>22</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>179</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://translational-medicine.biomedcentral.com/articles/10.1186/s12967-020-02344-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12967-020-02344-6</pub-id>
          <pub-id pub-id-type="medline">32321524</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12967-020-02344-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7174922</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>ZA</given-names>
            </name>
            <name name-style="western">
              <surname>Baig</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Farouk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>YG</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Comparative genome analysis of novel coronavirus (SARS-CoV-2) from different geographical locations and the effect of mutations on major target proteins: An in silico insight</article-title>
          <source>PLoS One</source>
          <year>2020</year>
          <volume>15</volume>
          <issue>9</issue>
          <fpage>e0238344</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0238344"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0238344</pub-id>
          <pub-id pub-id-type="medline">32881907</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-12188</pub-id>
          <pub-id pub-id-type="pmcid">PMC7470274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sardar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Satish</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Birla</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Integrative analyses of SARS-CoV-2 genomes from different geographical locations reveal unique features potentially consequential to host-virus interaction, pathogenesis and clues for novel therapies</article-title>
          <source>Heliyon</source>
          <year>2020</year>
          <month>09</month>
          <volume>6</volume>
          <issue>9</issue>
          <fpage>e04658</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-8440(20)31502-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.heliyon.2020.e04658</pub-id>
          <pub-id pub-id-type="medline">32844125</pub-id>
          <pub-id pub-id-type="pii">S2405-8440(20)31502-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC7439967</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alouane</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Laamarti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Essabbar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hakmi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bouricha</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Chemao-Elfihri</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Kartti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Boumajdi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bendani</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Laamarti</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ghrifi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Allam</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aanniz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ouadghiri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>El Hafidi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>El Jaoudi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Benrahma</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Attar</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Mentag</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sbabou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nejjari</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Amzazi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Belyamani</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ibrahimi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Genomic diversity and hotspot mutations in 30,983 SARS-CoV-2 genomes: moving toward a universal vaccine for the "confined virus"?</article-title>
          <source>Pathogens</source>
          <year>2020</year>
          <month>10</month>
          <day>10</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>829</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=pathogens9100829"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/pathogens9100829</pub-id>
          <pub-id pub-id-type="medline">33050463</pub-id>
          <pub-id pub-id-type="pii">pathogens9100829</pub-id>
          <pub-id pub-id-type="pmcid">PMC7600297</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
