<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JBB</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Bioinform Biotech</journal-id>
      <journal-title>JMIR Bioinformatics and Biotechnology</journal-title>
      <issn pub-type="epub">2563-3570</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v3i1e31536</article-id>
      <article-id pub-id-type="pmid">35309411</article-id>
      <article-id pub-id-type="doi">10.2196/31536</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>The Easy-to-Use SARS-CoV-2 Assembler for Genome Sequencing: Development Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Tausch</surname>
            <given-names>Simon</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Miao</surname>
            <given-names>Yu</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Rueca</surname>
            <given-names>Martina</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5162-046X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Giombini</surname>
            <given-names>Emanuela</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2237-9755</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Messina</surname>
            <given-names>Francesco</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Laboratory of Microbiology and Biological Bank</institution>
            <institution>National Institute for Infectious Diseases “Lazzaro Spallanzani”</institution>
            <institution>Istituto di Ricovero e Cura a Carattere Scientifico</institution>
            <addr-line>Via Portuense 292</addr-line>
            <addr-line>Rome, 00149</addr-line>
            <country>Italy</country>
            <phone>39 0655170668</phone>
            <email>francesco.messina@inmi.it</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8076-7217</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Bartolini</surname>
            <given-names>Barbara</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3882-3996</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Di Caro</surname>
            <given-names>Antonino</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6027-3009</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Capobianchi</surname>
            <given-names>Maria Rosaria</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3465-0071</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Gruber</surname>
            <given-names>Cesare EM</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8831-3380</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Laboratory of Virology and Biosafety Laboratories</institution>
        <institution>National Institute for Infectious Diseases “Lazzaro Spallanzani”</institution>
        <institution>Istituto di Ricovero e Cura a Carattere Scientifico</institution>
        <addr-line>Rome</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Laboratory of Microbiology and Biological Bank</institution>
        <institution>National Institute for Infectious Diseases “Lazzaro Spallanzani”</institution>
        <institution>Istituto di Ricovero e Cura a Carattere Scientifico</institution>
        <addr-line>Rome</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>UniCamillus - Saint Camillus International University of Health Sciences</institution>
        <addr-line>Roma</addr-line>
        <country>Italy</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Francesco Messina <email>francesco.messina@inmi.it</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jan-Dec</season>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>3</month>
        <year>2022</year>
      </pub-date>
      <volume>3</volume>
      <issue>1</issue>
      <elocation-id>e31536</elocation-id>
      <history>
        <date date-type="received">
          <day>24</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>30</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>11</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>5</day>
          <month>2</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Martina Rueca, Emanuela Giombini, Francesco Messina, Barbara Bartolini, Antonino Di Caro, Maria Rosaria Capobianchi, Cesare EM Gruber. Originally published in JMIR Bioinformatics and Biotechnology (https://bioinform.jmir.org), 14.03.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Bioinformatics and Biotechnology, is properly cited. The complete bibliographic information, a link to the original publication on https://bioinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://bioinform.jmir.org/2022/1/e31536" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Early sequencing and quick analysis of the SARS-CoV-2 genome have contributed to the understanding of the dynamics of COVID-19 epidemics and in designing countermeasures at a global level.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Amplicon-based next-generation sequencing (NGS) methods are widely used to sequence the SARS-CoV-2 genome and to identify novel variants that are emerging in rapid succession as well as harboring multiple deletions and amino acid–changing mutations.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>To facilitate the analysis of NGS sequencing data obtained from amplicon-based sequencing methods, here, we propose an easy-to-use SARS-CoV-2 genome assembler: the Easy-to-use SARS-CoV-2 Assembler (ESCA) pipeline.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our results have shown that ESCA could perform high-quality genome assembly from Ion Torrent and Illumina raw data and help the user in easily correct low-coverage regions. Moreover, ESCA includes the possibility of comparing assembled genomes of multisample runs through an easy table format.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>In conclusion, ESCA automatically furnished a variant table output file, fundamental to rapidly recognizing variants of interest. Our pipeline could be a useful method for obtaining a complete, rapid, and accurate analysis even with minimal knowledge in bioinformatics.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>SARS-CoV-2 genome</kwd>
        <kwd>bioinformatics tool</kwd>
        <kwd>NGS data analysis</kwd>
        <kwd>COVID-19</kwd>
        <kwd>genome</kwd>
        <kwd>health informatics</kwd>
        <kwd>bioinformatic</kwd>
        <kwd>digital tools</kwd>
        <kwd>algorithms</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Next-generation sequencing (NGS) has reached a pivotal role in the field of emerging infectious diseases by enhancing the development capacity of new diagnostic methods, vaccines, and drugs [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Moreover, a key role has been recognized for sequence data production and sharing in outbreak response and management [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. In the current COVID-19 epidemic, more than 6 million full genome sequences of SARS-CoV-2 have been deposited in publicly accessible databases in the arc of 1 year (ie, GISAID) [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. SARS-CoV-2 genome surveillance on a global scale is permitting real-time analysis of the outbreak, with a direct impact on the public health response. This contribution includes the tracing of SARS-CoV-2 spread over time and space, evidence of emerging variants that may affect pathogenicity, transmission capacity, diagnostic methods, therapeutics, or vaccines [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Recently divergent SARS-CoV-2 variants are emerging in rapid succession, harboring multiple deletions and amino acid mutations. Some mutations occur in the receptor-binding domain of the spike protein and are associated with an increase of angiotensin-converting enzyme 2 (ACE2) affinity as well as a potential reduction of polyclonal human plasma antibody efficacy [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. The growing contribution of sequence information to public health is driving global investment in sequencing facilities and scientific programs [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. The falling cost of generating genomic NGS data provides new chances for sequencing capacity expansion; however, many laboratories have low sequencing capacity and even a lack of expertise for data elaboration.</p>
      <p>While sequencing runs can be performed without consolidated experience in the infectious disease field, virus genomic sequence assembly is often a demanding task. Translating SARS-CoV-2 raw read data into reliable and informative results is complex and requires solid bioinformatics knowledge, particularly for low-coverage samples. Some steps can lead to incorrect variant calling and produce erroneous assembled sequences.</p>
      <p>Supervision of the sequence assembly to avoid inconsistent or misleading assignment of a virus to a taxonomic lineage or clade [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>] as well as evaluation of low-coverage samples to prevent loss of epidemiological information are mandatory.</p>
      <p>Many tools have been developed to support whole genome sequence reconstruction, starting with reads produced by different NGS platforms. However, most tools have been designed for genome assembly of other viruses and often are able to elaborate only a specific type of data. Some of these tools, for example, have implemented the assembly method for one specific platform (ie, Loretta for PacBio data) [<xref ref-type="bibr" rid="ref16">16</xref>] or for a specific sequencing approach (ie, UNAGI for Nanopore and Illumina data) [<xref ref-type="bibr" rid="ref17">17</xref>]. Some sequencing platform manufacturers have proposed pipelines for SARS-CoV-2 genome reconstruction that have been designed to obtain the most accurate sequence from one specific technological output. For example, Illumina developed the DRAGEN tool for SARS-CoV-2 genome analysis, a commercial tool that is temporarily free and available online, while Ion Torrent suggests the iterative refinement meta-assembler (IRMA) for SARS-CoV-2 data analyses, an open-source program developed by the Centers for Disease Control and Prevention (CDC) [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      <p>We propose the Easy-to-use SARS-CoV-2 Assembler (ESCA) pipeline: a novel reference-based genome assembly pipeline specifically designed for SARS-CoV-2 data analysis. This pipeline was created to support laboratories with limited experience in bioinformatics for SARS-CoV-2 analysis. ESCA can be easily installed and runs in most Linux environments.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>The ESCA pipeline is a reference-based assembly algorithm written for Linux environments and requires only raw reads as input files, without any other information. Two versions of the software are available: one for Illumina paired-end reads in the “fastq.gz” file format and the other for Ion Torrent reads in the “ubam” file format.</p>
        <p>The software is designed to process several samples in a single run. All reads (paired or unpaired) must be copied into the same working directory, and then, the program is launched through the command line by typing “StartEasyTorrent” for IonTorrent input or “StartEasyIllumina” for Illumina input. The pipeline than performs all the other passages automatically, as described in the following paragraphs.</p>
        <p>The program processes all input reads, dividing them into different samples using file names as identifiers. Illumina paired-end reads are expected to be divided into 2 files that contain “R1” or “R2” to distinguish forward reads from reverse reads.</p>
        <p>Sample preprocessing is performed by filtering out all reads with a mean Phred quality score lower than 20 and that are less than 30 nucleotides long.</p>
        <p>Filtered reads are mapped on the SARS-CoV-2 reference genome Wuhan-Hu-1 (GenBank Accession Number NC_045512.2) with bwa-mem software [<xref ref-type="bibr" rid="ref15">15</xref>]; all reads that do not map on the reference genome are then discarded.</p>
        <p>Genome coverage is then analyzed: The read-mapping file is converted into “sorted-bam” and “mpileup” files using samtools software [<xref ref-type="bibr" rid="ref19">19</xref>], and these data are translated into a detailed coverage table that reports the count of nucleotides observed at each position.</p>
        <p>The consensus sequence is then reconstructed on the basis of 3 parameters: (1) frequency of nucleotides observed at each position, (2) nucleotide coverage, (3) reference genome sequence.</p>
        <p>Briefly, sample parameters for consensus sequence reconstruction are designed to call the nucleotide observed with &gt;50% frequency and with a coverage of &gt;50 reads, but the minimum coverage is reduced at &gt;10 reads if the most frequent nucleotide observed is identical to the nucleotide observed in the reference genome.</p>
        <p>For all positions where these parameters are not satisfied, the ESCA pipeline is designed to call “N” to indicate a low coverage position or an intrasample nucleotide variant.</p>
        <p>After whole genome reconstruction of all samples, the consensus sequences are aligned with the Wuhan-Hu-1 reference genome using MAFFT software [<xref ref-type="bibr" rid="ref20">20</xref>], and a mutation table is generated, reporting nucleotide mutations of all the genomes assembled.</p>
      </sec>
      <sec>
        <title>Illumina Data</title>
        <p>To test the efficiency of the ESCA pipeline, 228 SARS-CoV-2–positive samples were sequenced with Illumina platforms using the Ion AmpliSeq SARS-CoV-2 Research Panel following the manufacturer’s instructions (ThermoFisher, Waltham, MA). For Illumina samples, whole SARS-CoV-2 genome sequences were assembled using both ESCA and DRAGEN RNA Pathogen Detection v.3.5.15 (BaseSpace) with default parameters.</p>
      </sec>
      <sec>
        <title>Ion Torrent Data</title>
        <p>A resequencing assay on Ion Torrent platforms was carried out for the same 228 SARS-CoV-2–positive samples using the Ion AmpliSeq SARS-CoV-2 Research Panel following the manufacturer’s instructions (ThermoFisher).</p>
        <p>For Ion Torrent samples, whole SARS-CoV-2 genome sequences were assembled with ESCA and IRMA software [<xref ref-type="bibr" rid="ref18">18</xref>] using the setting parameters indicated by ThermoFisher, in order to test the consistency of ESCA and IRMA outputs.</p>
      </sec>
      <sec>
        <title>Performance Test</title>
        <p>The respective results were compared, aligning the sequences obtained using the 2 methods with the reference sequence Wuhan-Hu-1 (NCBI Acc. Numb. NC_045512.2), and the corrected sequence was submitted to GISAID, using MAFFT [<xref ref-type="bibr" rid="ref20">20</xref>]. Then, each discordant position was evaluated following the classification reported in <xref rid="figure1" ref-type="fig">Figure 1</xref>. In particular, we evaluated true positives (TP; mutations correctly classified as real); false negatives (FN; mutations correctly classified as unreal); false positives (FP; mutations incorrectly classified as real); true negatives (TN; mutations correctly classified as unreal); corrected TN (positions unknown correctly classified as N); and TN error (positions unknown, incorrectly classified as N).</p>
        <p>To test the performances with respect to mean coverage, linear regression correlation analysis was carried out for mean coverage and specific measures of accuracy.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Classification scheme for genome assemblers, in which assembled genome sequences (SEQ) were compared with the corresponding submitted sequences (on GISAID) and with reference genome sequence “Wuhan-Hu-1” (REF). Nucleotide threesomes were classified using the following 11 categories: false deletion (Fd), false insertion (Fi), false negative (FN), false positive (FP), mutation error (Me), N correct (Nc), N error (Ne), true deletion (Td), true insertion (Ti), true negative (TN), true positive (TP).</p>
          </caption>
          <graphic xlink:href="bioinform_v3i1e31536_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>In the computational evaluation, ESCA software was compared with the most often used assemblers for SARS-CoV-2 genome analysis on 228 SARS-CoV-2–positive samples.</p>
      <p>Sequencing was performed on Illumina MiSeq for 65 libraries, obtaining a median of 1.50 x 106 paired-end reads per sample (range: 0.02 x 106 to 4.56 x 106), and on Ion Gene Studio S5 Sequencer for 163 libraries, obtaining a median of 0.61 x 106 single-end reads per sample (range: 0.02 x 106 to 3.02 x 106). Using the ESCA reconstruction, the coverage point by point was calculated, and we observed that, in the Illumina sample, the point coverage was not uniform, although the mean coverage was quite high in all samples (average 3508X; range: 70-10,733). This could introduce error in genome reconstruction using some software. In this context, ESCA could reduce the error in regions with low coverage. In parallel, mean coverage obtained with Ion Torrent was 4966X (range: 94-19,917), but a higher uniformity was observed. The comparison of the coverage distribution is shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
      <p>To evaluate the ESCA and DRAGEN/IRMA results, assembled genomes, the reference Wuhan-Hu-1, and the corrected genome of GISAID (Accession IDs available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) were aligned with MAFFT [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
      <p>At each position along the SARS-CoV-2 genome, the 24 available nucleotide combinations were classified in 11 mutation categories (<xref rid="figure1" ref-type="fig">Figure 1</xref>). For all sequences, the number of occurrences of mutation categories for each assembly software was then evaluated.</p>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Comparison of true positive mutations between our Easy-to-use SARS-CoV-2 Assembler (ESCA) and the (A) Illumina DRAGEN tool and (B) iterative refinement meta-assembler (IRMA) recommended by Ion Torrent.</p>
        </caption>
        <graphic xlink:href="bioinform_v3i1e31536_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <sec>
        <title>Illumina Data</title>
        <p>The comparison of ESCA with DRAGEN showed that, as expected, the mean number of mutations in genomes was very low (in the mean 28 position) and ESCA could correctly identify a mean 27 of 28 mutations (<xref rid="figure2" ref-type="fig">Figure 2</xref>A). Moreover, no FN positions were identified by ESCA. This is due to the pipeline design that reduces the error of introducing N where the coverage is not sufficient. The DRAGEN genome, instead, showed a mean of 25 of 28 TP and 3 FN positions. The absence of a mutation in specific positions could be essential to assigning the lineage, and the presence of FNs could modify the identification of the variants.</p>
        <p>On the other hand, both ESCA and DRAGEN did not introduce FN, identifying 29,308 and 28,027 TN positions, respectively.</p>
        <p>These results show an accuracy of 100% for ESCA and 99.99% for DRAGEN. Moreover, the sensitivity of ESCA compared with DRAGEN was 96.43% for ESCA and 89.29% for DRAGEN, and the specificity with both methods was 100%.</p>
      </sec>
      <sec>
        <title>Ion Torrent Data</title>
        <p>Parallel to the previous comparison, ESCA compared with IRMA showed that both methods identified a mean 25 of 26 TP positions (<xref rid="figure2" ref-type="fig">Figure 2</xref>B) but did not induce FN. However, IRMA introduced a certain number of errors. In fact, the FP was 20 for IRMA, compared with 0 for ESCA. Once again, the introduction of mutations could induce error in the lineage assignation.</p>
        <p>The accuracy of IRMA was calculated to be 99.93%, while it was 100% for ESCA.</p>
        <p>Moreover, although the sensitivity was identical with the 2 methods (96.15%), the specificity was 99.93% for IRMA and 100% for ESCA.</p>
      </sec>
      <sec>
        <title>Performance Test</title>
        <p>To evaluate the performance of each of the methods, linear regression correlation analysis was carried out with respect to mean coverage (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p>
        <p>For IonTorrent single-end sequencing data, a significant positive correlation was found comparing coverage and TN for both IRMA and ESCA (r&gt;0.15, <italic>P</italic>&lt;.05), while for Illumina pair-end sequencing data, such a correlation was found only for DRAGEN (r&gt;0.40, <italic>P</italic>&lt;.05). This difference could be caused by a different error rate for the 2 sequencing techniques. These data suggest that all assembly methods are comparable in the case of high coverage samples, while ESCA seems to perform better for low coverage data.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The importance of rapidly obtaining and sharing high-quality whole genomes of SARS-CoV-2 is increasing with the emerging variant strains [<xref ref-type="bibr" rid="ref14">14</xref>]. For this reason, the use of NGS custom amplicon panels can be a rapid and performant method for identifying viral variants. However, a lack of bioinformatic skills could be a problem in handling NGS raw data. Our pipeline ESCA provides help to laboratories with low bioinformatic capacity using a single command. Both of the more common methods for the analysis of Ion Torrent and Illumina data (IRMA and DRAGEN, respectively) have shown a certain amount of error that could induce false identification in variant assignation. On the contrary, the SARS-CoV-2 genome obtained by ESCA shows a reduced number of false insertions and false mutations and a higher number of real mutations.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This pipeline should be tested on a larger number of sequences and with other sequencing technologies.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>ESCA automatically produces a variant table output file, fundamental for rapidly recognizing variants of interest.</p>
        <p>These results show how ESCA could be a useful method for obtaining a rapid, complete, and correct analysis even with minimal skill in bioinformatics.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Comparison of Easy-to-use SARS-CoV-2 Assembler (ESCA) and (first tab: Ion Torrent) iterative refinement meta-assembler (IRMA) and (second tab: Illumina) DRAGEN results for every assembled SARS-CoV-2 genome. DELerror: deletion unknown incorrectly identified; errorMut: number of incorrected mutations described; FN: false negative; FP: false positive; INScorr: insertion unknown correctly identified; INSerror: insertion unknown incorrectly identified; NCorr: positions unknown correctly classified as N; Nerror: position unknown incorrectly classified as N; TN: true negative; TP: true positive.</p>
        <media xlink:href="bioinform_v3i1e31536_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 36 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Pairwise linear regression correlation analysis (shown with the <italic>P</italic> value) for every parameter: DELerror: deletion unknown incorrectly identified; FN: false negative; FP: false positive; INScorr: insertion unknown correctly identified; INSerror: insertion unknown incorrectly identified; NCorr: positions unknown correctly classified as N; Nerror: position unknown incorrectly classified as N; TN: true negative; TP: true positive.</p>
        <media xlink:href="bioinform_v3i1e31536_app2.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 41 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACE2</term>
          <def>
            <p>angiotensin-converting enzyme 2</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CDC</term>
          <def>
            <p>Centers for Disease Control and Prevention</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ESCA</term>
          <def>
            <p>Easy-to-use SARS-CoV-2 Assembler</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">FN</term>
          <def>
            <p>false negative</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">FP</term>
          <def>
            <p>false positive</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">IRMA</term>
          <def>
            <p>iterative refinement meta-assembler</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">NGS</term>
          <def>
            <p>next-generation sequencing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">TN</term>
          <def>
            <p>true negative</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">TP</term>
          <def>
            <p>true positive</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We gratefully acknowledge the contributors of the genome sequences of the newly emerging coronavirus (ie, the originating laboratories) for sharing sequences and other metadata through the GISAID Initiative, on which this research is based. We also acknowledge Ornella Butera, Francesco Santini, and Giulia Bonfiglio for their contribution to sample preparation. National Institute for Infectious Diseases Lazzaro Spallanzani IRCCS received financial support from the Italian Ministry of Health grants “Ricerca Corrente” (Progetto 1-2763705) and “5 PER MILLE 2020” (iSNV study for early detection and risk analysis of SARS-CoV-2 mutations with impact on clinical management of COVID-19) research funds.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>World Health Organization (WHO)</collab>
          </person-group>
          <article-title>Genomic sequencing of SARS-CoV-2: a guide to implementation for maximum impact on public health</article-title>
          <source>World Health Organization</source>
          <year>2021</year>
          <month>01</month>
          <day>08</day>
          <access-date>2022-02-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/publications/i/item/9789240018440">https://www.who.int/publications/i/item/9789240018440</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greaney</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Loes</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Crawford</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Starr</surname>
              <given-names>TN</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Bloom</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Comprehensive mapping of mutations in the SARS-CoV-2 receptor-binding domain that affect recognition by polyclonal human plasma antibodies</article-title>
          <source>Cell Host Microbe</source>
          <year>2021</year>
          <month>03</month>
          <day>10</day>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>463</fpage>
          <lpage>476.e6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33592168"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chom.2021.02.003</pub-id>
          <pub-id pub-id-type="medline">33592168</pub-id>
          <pub-id pub-id-type="pii">S1931-3128(21)00082-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7869748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>GJD</given-names>
            </name>
            <name name-style="western">
              <surname>Vijaykrishna</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bahl</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lycett</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Worobey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pybus</surname>
              <given-names>OG</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Raghwani</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Peiris</surname>
              <given-names>JSM</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rambaut</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Origins and evolutionary genomics of the 2009 swine-origin H1N1 influenza A epidemic</article-title>
          <source>Nature</source>
          <year>2009</year>
          <month>06</month>
          <day>25</day>
          <volume>459</volume>
          <issue>7250</issue>
          <fpage>1122</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1038/nature08182</pub-id>
          <pub-id pub-id-type="medline">19516283</pub-id>
          <pub-id pub-id-type="pii">nature08182</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Revez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Espinosa</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Albiger</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Leitmeyer</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Struelens</surname>
              <given-names>MJ</given-names>
            </name>
            <collab>ECDC National Microbiology Focal Points and Experts Group</collab>
          </person-group>
          <article-title>Survey on the use of whole-genome sequencing for infectious diseases surveillance: rapid expansion of European National Capacities, 2015-2016</article-title>
          <source>Front Public Health</source>
          <year>2017</year>
          <volume>5</volume>
          <fpage>347</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fpubh.2017.00347"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2017.00347</pub-id>
          <pub-id pub-id-type="medline">29326921</pub-id>
          <pub-id pub-id-type="pmcid">PMC5741818</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nadon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Van Walle</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Gerner-Smidt</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Campos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chinen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Concepcion-Acevedo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gilpin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Man Kam</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Trees</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kubota</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Takkinen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Carleton</surname>
              <given-names>H</given-names>
            </name>
            <collab>FWD-NEXT Expert Panel</collab>
          </person-group>
          <article-title>PulseNet International: Vision for the implementation of whole genome sequencing (WGS) for global food-borne disease surveillance</article-title>
          <source>Euro Surveill</source>
          <year>2017</year>
          <month>06</month>
          <day>08</day>
          <volume>22</volume>
          <issue>23</issue>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.eurosurveillance.org/ViewArticle.aspx?ArticleId=22807"/>
          </comment>
          <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2017.22.23.30544</pub-id>
          <pub-id pub-id-type="medline">28662764</pub-id>
          <pub-id pub-id-type="pii">30544</pub-id>
          <pub-id pub-id-type="pmcid">PMC5479977</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elbe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Buckland-Merrett</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Data, disease and diplomacy: GISAID's innovative contribution to global health</article-title>
          <source>Glob Chall</source>
          <year>2017</year>
          <month>01</month>
          <day>10</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>33</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/gch2.1018"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/gch2.1018</pub-id>
          <pub-id pub-id-type="medline">31565258</pub-id>
          <pub-id pub-id-type="pii">GCH21018</pub-id>
          <pub-id pub-id-type="pmcid">PMC6607375</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>NCBI Resource Coordinators</collab>
          </person-group>
          <article-title>Database resources of the National Center for Biotechnology Information</article-title>
          <source>Nucleic Acids Res</source>
          <year>2018</year>
          <month>01</month>
          <day>04</day>
          <volume>46</volume>
          <issue>D1</issue>
          <fpage>D8</fpage>
          <lpage>D13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29140470"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkx1095</pub-id>
          <pub-id pub-id-type="medline">29140470</pub-id>
          <pub-id pub-id-type="pii">4621330</pub-id>
          <pub-id pub-id-type="pmcid">PMC5753372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>An interactive web-based dashboard to track COVID-19 in real time</article-title>
          <source>Lancet Infect Dis</source>
          <year>2020</year>
          <month>05</month>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>533</fpage>
          <lpage>534</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32087114"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="medline">32087114</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hadfield</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Megill</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Huddleston</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Potter</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Callender</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sagulenko</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bedford</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Neher</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Nextstrain: real-time tracking of pathogen evolution</article-title>
          <source>Bioinformatics</source>
          <year>2018</year>
          <month>12</month>
          <day>01</day>
          <volume>34</volume>
          <issue>23</issue>
          <fpage>4121</fpage>
          <lpage>4123</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29790939"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/bty407</pub-id>
          <pub-id pub-id-type="medline">29790939</pub-id>
          <pub-id pub-id-type="pii">5001388</pub-id>
          <pub-id pub-id-type="pmcid">PMC6247931</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rambaut</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>O'Toole</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>McCrone</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Ruis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>du Plessis</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pybus</surname>
              <given-names>OG</given-names>
            </name>
          </person-group>
          <article-title>A dynamic nomenclature proposal for SARS-CoV-2 lineages to assist genomic epidemiology</article-title>
          <source>Nat Microbiol</source>
          <year>2020</year>
          <month>11</month>
          <volume>5</volume>
          <issue>11</issue>
          <fpage>1403</fpage>
          <lpage>1407</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32669681"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41564-020-0770-5</pub-id>
          <pub-id pub-id-type="medline">32669681</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41564-020-0770-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7610519</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
          <source>Outbreak.info</source>
          <access-date>2022-02-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://outbreak.info/">https://outbreak.info/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cameroni</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bowen</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Rosen</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Saliba</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zepeda</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Culap</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pinto</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>VanBlargan</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>De Marco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>di Iulio</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zatta</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Noack</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Farhat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Czudnochowski</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Havenar-Daughton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sprouse</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Dillen</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Powell</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Maher</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Soriaga</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bassi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Silacci-Fregni</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gustafsson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Franko</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Logue</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Iqbal</surname>
              <given-names>NT</given-names>
            </name>
            <name name-style="western">
              <surname>Mazzitelli</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Geffner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grifantini</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gori</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Riva</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giannini</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Ceschi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrari</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cippà</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Franzetti-Pellanda</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garzoni</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Halfmann</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kawaoka</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hebner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Purcell</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Piccoli</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzuto</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Walls</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Diamond</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Telenti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Virgin</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Lanzavecchia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Snell</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Veesler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Corti</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Broadly neutralizing antibodies overcome SARS-CoV-2 Omicron antigenic shift</article-title>
          <source>Nature</source>
          <year>2022</year>
          <month>02</month>
          <day>10</day>
          <volume>602</volume>
          <issue>7898</issue>
          <fpage>664</fpage>
          <lpage>670</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33592168"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-021-04386-2</pub-id>
          <pub-id pub-id-type="medline">35016195</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-021-04386-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7869748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Focosi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maggi</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Neutralising antibody escape of SARS-CoV-2 spike protein: Risk assessment for antibody-based Covid-19 therapeutics and vaccines</article-title>
          <source>Rev Med Virol</source>
          <year>2021</year>
          <month>11</month>
          <volume>31</volume>
          <issue>6</issue>
          <fpage>e2231</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33724631"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/rmv.2231</pub-id>
          <pub-id pub-id-type="medline">33724631</pub-id>
          <pub-id pub-id-type="pmcid">PMC8250244</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <article-title>SARS-CoV-2 genomic sequencing for public health goals: Interim guidance, 8 January 2021</article-title>
          <source>World Health Organization</source>
          <year>2021</year>
          <month>01</month>
          <day>08</day>
          <access-date>2022-02-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/publications/i/item/WHO-2019-nCoV-genomic_sequencing-2021.1">https://www.who.int/publications/i/item/WHO-2019-nCoV-genomic_sequencing-2021.1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Durbin</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Fast and accurate short read alignment with Burrows-Wheeler transform</article-title>
          <source>Bioinformatics</source>
          <year>2009</year>
          <month>07</month>
          <day>15</day>
          <volume>25</volume>
          <issue>14</issue>
          <fpage>1754</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19451168"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id>
          <pub-id pub-id-type="medline">19451168</pub-id>
          <pub-id pub-id-type="pii">btp324</pub-id>
          <pub-id pub-id-type="pmcid">PMC2705234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al Qaffas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nichols</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ourahmane</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hertel</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McVoy</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Camiolo</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>LoReTTA, a user-friendly tool for assembling viral genomes from PacBio sequence data</article-title>
          <source>Virus Evol</source>
          <year>2021</year>
          <month>01</month>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>veab042</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33996146"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ve/veab042</pub-id>
          <pub-id pub-id-type="medline">33996146</pub-id>
          <pub-id pub-id-type="pii">veab042</pub-id>
          <pub-id pub-id-type="pmcid">PMC8111061</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al Kadi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ito</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kameoka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hishida</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Motooka</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Iida</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Okuzaki</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>UNAGI: an automated pipeline for nanopore full-length cDNA sequencing uncovers novel transcripts and isoforms in yeast</article-title>
          <source>Funct Integr Genomics</source>
          <year>2020</year>
          <month>07</month>
          <day>18</day>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>523</fpage>
          <lpage>536</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31955296"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10142-020-00732-1</pub-id>
          <pub-id pub-id-type="medline">31955296</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10142-020-00732-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7283198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shepard</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Meno</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bahl</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Neuhaus</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Viral deep sequencing needs an adaptive approach: IRMA, the iterative refinement meta-assembler</article-title>
          <source>BMC Genomics</source>
          <year>2016</year>
          <month>09</month>
          <day>05</day>
          <volume>17</volume>
          <fpage>708</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcgenomics.biomedcentral.com/articles/10.1186/s12864-016-3030-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12864-016-3030-6</pub-id>
          <pub-id pub-id-type="medline">27595578</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12864-016-3030-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5011931</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Handsaker</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wysoker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fennell</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ruan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Homer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Marth</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Abecasis</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Durbin</surname>
              <given-names>R</given-names>
            </name>
            <collab>1000 Genome Project Data Processing Subgroup</collab>
          </person-group>
          <article-title>The Sequence Alignment/Map format and SAMtools</article-title>
          <source>Bioinformatics</source>
          <year>2009</year>
          <month>08</month>
          <day>15</day>
          <volume>25</volume>
          <issue>16</issue>
          <fpage>2078</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19505943"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id>
          <pub-id pub-id-type="medline">19505943</pub-id>
          <pub-id pub-id-type="pii">btp352</pub-id>
          <pub-id pub-id-type="pmcid">PMC2723002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Katoh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Misawa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kuma</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Miyata</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>MAFFT: a novel method for rapid multiple sequence alignment based on fast Fourier transform</article-title>
          <source>Nucleic Acids Res</source>
          <year>2002</year>
          <month>07</month>
          <day>15</day>
          <volume>30</volume>
          <issue>14</issue>
          <fpage>3059</fpage>
          <lpage>66</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/12136088"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkf436</pub-id>
          <pub-id pub-id-type="medline">12136088</pub-id>
          <pub-id pub-id-type="pmcid">PMC135756</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
