<!DOCTYPE article
PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD with MathML3 v1.2 20190208//EN" "JATS-archivearticle1-mathml3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" article-type="research-article"><?properties open_access?><front><journal-meta><journal-id journal-id-type="nlm-ta">Emerg Infect Dis</journal-id><journal-id journal-id-type="iso-abbrev">Emerg Infect Dis</journal-id><journal-id journal-id-type="publisher-id">EID</journal-id><journal-title-group><journal-title>Emerging Infectious Diseases</journal-title></journal-title-group><issn pub-type="ppub">1080-6040</issn><issn pub-type="epub">1080-6059</issn><publisher><publisher-name>Centers for Disease Control and Prevention</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="pmid">33900175</article-id><article-id pub-id-type="pmc">8084492</article-id><article-id pub-id-type="publisher-id">20-4579</article-id><article-id pub-id-type="doi">10.3201/eid2705.204579</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research</subject></subj-group><subj-group subj-group-type="article-type"><subject>Research</subject></subj-group><subj-group subj-group-type="TOC-title"><subject>Use of Genomics to Track Coronavirus Disease Outbreaks, New Zealand</subject></subj-group></article-categories><title-group><article-title>Use of Genomics to Track Coronavirus Disease Outbreaks, New Zealand</article-title><alt-title alt-title-type="running-head">Genomics to Track Coronavirus Disease Outbreaks</alt-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name><surname>Geoghegan</surname><given-names>Jemma L.</given-names></name><xref ref-type="fn" rid="FN1"><sup>1</sup></xref></contrib><contrib contrib-type="author"><name><surname>Douglas</surname><given-names>Jordan</given-names></name><xref ref-type="fn" rid="FN1"><sup>1</sup></xref></contrib><contrib contrib-type="author"><name><surname>Ren</surname><given-names>Xiaoyun</given-names></name></contrib><contrib contrib-type="author"><name><surname>Storey</surname><given-names>Matthew</given-names></name></contrib><contrib contrib-type="author"><name><surname>Hadfield</surname><given-names>James</given-names></name></contrib><contrib contrib-type="author"><name><surname>Silander</surname><given-names>Olin K.</given-names></name></contrib><contrib contrib-type="author"><name><surname>Freed</surname><given-names>Nikki E.</given-names></name></contrib><contrib contrib-type="author"><name><surname>Jelley</surname><given-names>Lauren</given-names></name></contrib><contrib contrib-type="author"><name><surname>Jefferies</surname><given-names>Sarah</given-names></name></contrib><contrib contrib-type="author"><name><surname>Sherwood</surname><given-names>Jillian</given-names></name></contrib><contrib contrib-type="author"><name><surname>Paine</surname><given-names>Shevaun</given-names></name></contrib><contrib contrib-type="author"><name><surname>Huang</surname><given-names>Sue</given-names></name></contrib><contrib contrib-type="author"><name><surname>Sporle</surname><given-names>Andrew</given-names></name></contrib><contrib contrib-type="author"><name><surname>Baker</surname><given-names>Michael G.</given-names></name></contrib><contrib contrib-type="author"><name><surname>Murdoch</surname><given-names>David R.</given-names></name></contrib><contrib contrib-type="author"><name><surname>Drummond</surname><given-names>Alexei J.</given-names></name></contrib><contrib contrib-type="author"><name><surname>Welch</surname><given-names>David</given-names></name></contrib><contrib contrib-type="author"><name><surname>Simpson</surname><given-names>Colin R.</given-names></name></contrib><contrib contrib-type="author"><name><surname>French</surname><given-names>Nigel</given-names></name></contrib><contrib contrib-type="author"><name><surname>Holmes</surname><given-names>Edward C.</given-names></name></contrib><contrib contrib-type="author"><name><surname>de Ligt</surname><given-names>Joep</given-names></name></contrib><aff id="aff1">University of Otago, Dunedin, New Zealand (J.L. Geoghegan); </aff><aff id="aff2">Institute of Environmental Science and Research, Wellington, New Zealand (J.L. Geoghegan, X. Ren, M. Storey, L. Jelley, S. Jefferies, J. Sherwood, S. Paine, S. Huang, J. de Ligt); </aff><aff id="aff3">University of Auckland, Auckland, New Zealand. (J. Douglas, A. Sporle, A.J. Drummond, D. Welch); </aff><aff id="aff4">Fred Hutchinson Cancer Research Centre, Seattle, Washington, USA (J. Hadfield); </aff><aff id="aff5">Massey University, Auckland (O.K. Silander, N.E. Freed); </aff><aff id="aff6">iNZight Analytics Ltd., Auckland (A. Sporle); </aff><aff id="aff7">University of Otago, Wellington (M.G. Baker); </aff><aff id="aff8">University of Otago, Christchurch, New Zealand (D.R. Murdoch); </aff><aff id="aff9">Victoria University of Wellington, Wellington (C.R. Simpson); </aff><aff id="aff10">University of Edinburgh, Edinburgh, Scotland, UK (C.R. Simpson); </aff><aff id="aff11">Massey University, Palmerston North, New Zealand (N. French); T</aff><aff id="aff12">he University of Sydney, Sydney, New South Wales, Australia (E.C. Holmes)</aff></contrib-group><author-notes><corresp id="cor1">Address for correspondence: Jemma L. Geoghegan, University of Otago Division of Health Sciences, Microbiology and Immunology, 720 Cumberland St, Dunedin, Otago 9054, New Zealand; email: <email xlink:href="jemma.geoghegan@otago.ac.nz">jemma.geoghegan@otago.ac.nz</email></corresp></author-notes><pub-date pub-type="ppub"><month>5</month><year>2021</year></pub-date><volume>27</volume><issue>5</issue><fpage>1317</fpage><lpage>1322</lpage><abstract><p>Real-time genomic sequencing has played a major role in tracking the global spread of severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2), contributing greatly to disease mitigation strategies. In August 2020, after having eliminated the virus, New Zealand experienced a second outbreak. During that outbreak, New Zealand used genomic sequencing in a primary role, leading to a second elimination of the virus. We generated genomes from 78% of the laboratory-confirmed samples of SARS-CoV-2 from the second outbreak and compared them with the available global genomic data. Genomic sequencing rapidly identified that virus causing the second outbreak in New Zealand belonged to a single cluster, thus resulting from a single introduction. However, successful identification of the origin of this outbreak was impeded by substantial biases and gaps in global sequencing data. Access to a broader and more heterogenous sample of global genomic data would strengthen efforts to locate the source of any new outbreaks.</p></abstract><kwd-group kwd-group-type="author"><title>Keywords: </title><kwd>2019 novel coronavirus disease</kwd><kwd>coronavirus disease</kwd><kwd>COVID-19</kwd><kwd>severe acute respiratory syndrome coronavirus 2</kwd><kwd>SARS-CoV-2</kwd><kwd>viruses</kwd><kwd>respiratory infections</kwd><kwd>zoonoses</kwd><kwd>genomics</kwd><kwd>infectious disease</kwd><kwd>New Zealand</kwd></kwd-group></article-meta></front><body><p>A genome of the novel severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2) was published only 12 days after the virus was identified (<xref rid="R1" ref-type="bibr"><italic>1</italic></xref>). This information was pivotal to the subsequent rapid development of diagnostic tests and identification of potential treatments (<xref rid="R2" ref-type="bibr"><italic>2</italic></xref>,<xref rid="R3" ref-type="bibr"><italic>3</italic></xref>). As of January 2021, &#x02248;400,000 genomes of SARS-CoV-2 had been shared publicly (<xref rid="R4" ref-type="bibr"><italic>4</italic></xref>). The underlying genome sequencing was performed so rapidly that during this infectious disease outbreak, virologic and epidemiologic data could be integrated in real time (<xref rid="R5" ref-type="bibr"><italic>5</italic></xref>). Analysis of these data also played a role in informing the coronavirus disease (COVID-19) response by tracking the global spread and evolution of SARS-CoV-2, including identification of the number, source, and timing of introductions into individual countries, leading to a greater understanding of COVID-19 outbreaks around the world (<xref rid="R6" ref-type="bibr"><italic>6</italic></xref>&#x02013;<xref rid="R9" ref-type="bibr"><italic>9</italic></xref>; A.D.S. Filipe et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.medrxiv.org/content/10.1101/2020.06.08.20124834v1">https://www.medrxiv.org/content/10.1101/2020.06.08.20124834v1</ext-link>; T. Seemann et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.medrxiv.org/content/10.1101/2020.05.12.20099929v1">https://www.medrxiv.org/content/10.1101/2020.05.12.20099929v1</ext-link>; L. Zhang et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.biorxiv.org/content/10.1101/2020.06.12.148726v1">https://www.biorxiv.org/content/10.1101/2020.06.12.148726v1</ext-link>; J. Douglas et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.medrxiv.org/content/10.1101/2020.08.04.20168518v1">https://www.medrxiv.org/content/10.1101/2020.08.04.20168518v1</ext-link>).</p><p>As of January 2021, of the 219 countries that had reported positive cases of COVID-19 to the World Health Organization (WHO) (<xref rid="R10" ref-type="bibr"><italic>10</italic></xref>), 65% (n = 142) had sequenced and shared SARS-CoV-2 genomes on the GISAID database (<ext-link ext-link-type="uri" xlink:href="https://www.gisaid.org">https://www.gisaid.org</ext-link>) (<xref rid="R4" ref-type="bibr"><italic>4</italic></xref>). This immense global sequencing effort has enhanced ongoing genomic surveillance of the pandemic, including the monitoring of viral genetic changes of interest (L. Zhang et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.biorxiv.org/content/10.1101/2020.06.12.148726v1">https://www.biorxiv.org/content/10.1101/2020.06.12.148726v1</ext-link>) and informing public health responses (<xref rid="R11" ref-type="bibr"><italic>11</italic></xref>&#x02013;<xref rid="R14" ref-type="bibr"><italic>14</italic></xref>). Nevertheless, the number and proportion of SARS-CoV-2 genomes from COVID-19 case-patients that were sequenced, and genomes published, varies dramatically between countries and over time (<xref ref-type="fig" rid="F1">Figure 1</xref>). For example, the COVID-19 Genomics UK Consortium (<ext-link ext-link-type="uri" xlink:href="https://www.cogconsortium.uk">https://www.cogconsortium.uk</ext-link>) has led to the United Kingdom being the most represented sampling location, totaling &#x02248;180,000 genomes and comprising 44% of the global dataset despite recording only &#x02248;4% of the world&#x02019;s positive cases (n = 3,669,658). Conversely, SARS-CoV-2 genomes sequenced in India represent just 1% of the global dataset but 11% of the world&#x02019;s total reported cases (n = 10,677,710).</p><fig id="F1" fig-type="figure" position="float"><label>Figure 1</label><caption><p>Sequenced and published genomes of global severe acute respiratory syndrome coronavirus 2 isolates. A) Proportion of global cases sequenced and shared on GISAID (<ext-link ext-link-type="uri" xlink:href="https://www.gisaid.org">https://www.gisaid.org</ext-link>) from December 2019 through January 2021, for which the second mode was largely driven by COG-UK as illustrated. B) Number of genomes sequenced and number of reported cases per country on a linear scale. Red, New Zealand (NZ); blue, other countries. C) Number of genomes sequenced and number of reported cases per country on a logarithmic scale. COG-UK, COVID-19 Genomics UK Consortium (<ext-link ext-link-type="uri" xlink:href="https://www.cogconsortium.uk">https://www.cogconsortium.uk</ext-link>); UK, United Kingdom; US, United States.</p></caption><graphic xlink:href="20-4579-F1"/></fig><p>Such disparate sequencing efforts can have major implications for data interpretation and must be carefully considered. Real-time sequencing of SARS-CoV-2 genomes has, however, been particularly useful for tracking the re-emergence of the virus in New Zealand. By June 2020, New Zealand had effectively eliminated COVID-19 in the community and positive cases were limited to those linked to managed quarantine facilities at the border (<xref rid="R7" ref-type="bibr"><italic>7</italic></xref>,<xref rid="R15" ref-type="bibr"><italic>15</italic></xref>; J. Douglas et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.medrxiv.org/content/10.1101/2020.08.04.20168518v1">https://www.medrxiv.org/content/10.1101/2020.08.04.20168518v1</ext-link>). After &#x02248;100 days with no detected community transmission of COVID-19, on August 11, 2020, four new cases emerged with no apparent epidemiologic link to any known case. We used genomic sequencing of SARS-CoV-2 cases to investigate the probable origins of this outbreak, generating genomes for 78% (n = 140) of the 179 laboratory-confirmed samples from this outbreak.</p><p>We obtained nasopharyngeal samples positive for SARS-CoV-2 by real-time reverse transcription PCR (rRT-PCR) from public health medical diagnostics laboratories located throughout New Zealand. All samples had been de-identified before receipt. Under contract for the New Zealand Ministry of Health, the Institute of Environmental Science and Research (ESR) has approval to conduct genomic sequencing for surveillance of notifiable diseases.</p><sec sec-type="methods"><title>Methods</title><sec><title>Genomic Sequencing</title><p>Of 179 laboratory-confirmed samples of SARS-CoV-2 from the August 2020 outbreak in New Zealand, 172 were received by ESR for whole-genome sequencing. Genome sequencing of SARS-CoV-2 samples was performed as before (<xref rid="R7" ref-type="bibr"><italic>7</italic></xref>). In brief, viral extracts were prepared from respiratory tract samples in which SARS-CoV-2 was detected by rRT-PCR by using World Health Organization&#x02013;recommended primers and probes targeting the envelope and nucleocapsid genes. Extracted RNA from SARS-CoV-2&#x02013;positive samples was subjected to whole-genome sequencing by following the ARTIC network protocol version 3 (<ext-link ext-link-type="uri" xlink:href="https://www.protocols.io/view/ncov-2019-sequencing-protocol-v3-locost-bh42j8ye">https://www.protocols.io/view/ncov-2019-sequencing-protocol-v3-locost-bh42j8ye</ext-link>) and using the Massey University 1200-bp primer set (<ext-link ext-link-type="uri" xlink:href="https://www.protocols.io/view/ncov-2019-sequencing-protocol-rapid-barcoding-1200-bh7hj9j6">https://www.protocols.io/view/ncov-2019-sequencing-protocol-rapid-barcoding-1200-bh7hj9j6</ext-link>) (<xref rid="R16" ref-type="bibr"><italic>16</italic></xref>).</p><p>We used 1 of the tiling amplicon designs to amplify viral cDNA prepared with SuperScript IV (ThermoFisher Scientific, <ext-link ext-link-type="uri" xlink:href="https://www.thermofisher.com">https://www.thermofisher.com</ext-link>). Sequence libraries were then constructed by using Oxford Nanopore Ligation Sequencing and Native Barcoding Expansion kits for samples amplified with the ARTIC version 3 primer sets and the Oxford Nanopore Rapid Barcoding Kit for samples amplified with the 1,200-bp primer sets (<ext-link ext-link-type="uri" xlink:href="https://nanoporetech.com">https://nanoporetech.com</ext-link>). We used the 1,200-bp primers and rapid barcoding when genomes were required urgently. Libraries were sequenced by using R9.4.1 MinION flow cells (Oxford Nanopore). Near-complete (&#x0003e;90% recovered) viral genomes were subsequently assembled through reference mapping. Steps included in the pipeline are described in detail at <ext-link ext-link-type="uri" xlink:href="https://github.com/ESR-NZ/NZ_SARS-CoV-2_genomics">https://github.com/ESR-NZ/NZ_SARS-CoV-2_genomics</ext-link>. The reads generated with Nanopore sequencing using ARTIC primer sets (version 3) were mapped and assembled by using the ARTIC bioinformatics Medaka pipeline version 1.1.0. In total, 140 of 172 genomes from the August 2020 outbreak passed quality control. All data are available on GISAID (<ext-link ext-link-type="uri" xlink:href="https://www.gisaid.org">https://www.gisaid.org</ext-link>).</p></sec><sec><title>Phylogenetic Analysis</title><p>All SARS-CoV-2 genomes from humans, assigned to the B.1.1.1. lineage in the pangolin nomenclature (<xref rid="R17" ref-type="bibr"><italic>17</italic></xref>), were obtained from GISAID (<xref rid="R4" ref-type="bibr"><italic>4</italic></xref>) (n = 7,363 as of January 26, 2021) and subsampled to include 1,996 most recent-in-time sequences to the August 2020 New Zealand outbreak along with 4 outgroup (non-B.1.1.1.) sequences. Sequences were aligned with those from the August 2020 outbreak (n = 140) by using MAFFT version 7 (<xref rid="R18" ref-type="bibr"><italic>18</italic></xref>) and the FFT-NS-2 progressive alignment algorithm (<xref ref-type="local-data" rid="SD1">Appendix 1</xref>). Bayesian phylogenetic analyses were performed by using BEAST 2.5 (<xref rid="R19" ref-type="bibr"><italic>19</italic></xref>). We used a strict clock model with an HKY (Hasegawa, Kishino, and Yano) substitution model (estimated frequencies) for each codon position and 1 for noncoding positions. We used the Bayesian skyline model (<xref rid="R20" ref-type="bibr"><italic>20</italic></xref>) as a tree to allow effective population sizes to change over time intervals. These components of the model and their prior distributions have been previously used (J. Douglas et al., unpub. data, <ext-link ext-link-type="uri" xlink:href="https://www.medrxiv.org/content/10.1101/2020.08.04.20168518v1">https://www.medrxiv.org/content/10.1101/2020.08.04.20168518v1</ext-link>). Phylogenetic trees were annotated by using FigTree version 1.4 (<ext-link ext-link-type="uri" xlink:href="http://tree.bio.ed.ac.uk/software/figtree/">http://tree.bio.ed.ac.uk/software/figtree</ext-link>) and Tree of Life version 4 (<xref rid="R21" ref-type="bibr"><italic>21</italic></xref>).</p></sec></sec><sec sec-type="results"><title>Results</title><p>Of the virus genomes generated in real time for 78% of cases in this cluster, from August 11 through September 14, 2020, when the last case in this outbreak was reported, the maximum distance among the genome was 5 single-nucleotide polymorphisms. When we compared the genomes from patients in the August 2020 New Zealand outbreak with sequenced genomes from patients affected by the first COVID-19 wave in New Zealand and those in quarantine facilities, we found no link. Most available sequence data from case-patients in New Zealand quarantine facilities indicated virus lineages different from those of the August 2020 outbreak. However, this observation was of limited value given that only 42% of case-patients in those quarantine facilities had adequate viral RNA for successful genomic sequencing. To determine the likely origins of this outbreak, we compared genomes from the new community outbreak to the global dataset.</p><p>An initial genomic sequence analysis found that the reemergence of COVID-19 in New Zealand was caused by a SARS-CoV-2 from the (now ancestral) lineage B.1.1.1 of the pangolin nomenclature (<xref rid="R17" ref-type="bibr"><italic>17</italic></xref>). Of the countries that have contributed SARS-CoV-2 data, 30% had genomes of this lineage. Remarkably, 80% of B.1.1.1. genomes were from the United Kingdom and were generated during March 2020&#x02013;January 2021; however, most samples were collected during the first wave of disease in the United Kingdom (<xref ref-type="fig" rid="F2">Figure 2</xref>). Phylogenetic analysis of the most recently sampled B.1.1.1. genomes identified genomes from South Africa, England, and Switzerland in August as the most likely to be contained within the sister clade (<xref ref-type="fig" rid="F2">Figure 2</xref>); these genomes were the closest sampled genomic relatives of the viruses associated with the August 2020 outbreak in New Zealand (<xref ref-type="local-data" rid="SD1">Appendix 2</xref>). Because of the dynamic nature of the pangolin lineage nomenclature, genomes sampled from the August 2020 outbreak in New Zealand are now distinctly classified as lineage C.12, which is now extinct.</p><fig id="F2" fig-type="figure" position="float"><label>Figure 2</label><caption><p>Genomic sequence analyses of global severe acute respiratory syndrome coronavirus 2 isolates. A) Maximum-clade credibility phylogenetic tree of 2,000 subsampled global genomes (1,996 most recently sampled B.1.1.1. plus 4 non-B.1.1.1. used as an outgroup) with an outer ring colored by sampling region. B) Posterior probability of genomes within the sister clade to that of the August 2020 outbreak in New Zealand, color coded by sampling location. C) Proportion of genomes within lineage B.1.1.1. in the global dataset over time, color-coded by sampling location.</p></caption><graphic xlink:href="20-4579-F2"/></fig><p>Additional Bayesian analysis estimated that the outbreak originated 10 days before the first transmission event; the 95% highest posterior density was 0&#x02013;25 days. We also estimated that the first transmission event in the outbreak occurred during July 22&#x02013;August 13, 2020 (95% highest posterior density mean date of August 2). Epidemiologic data showed that 2 confirmed case-patients linked to the outbreak had a symptom onset date of July 31, although the most probable sampled genomes within the sister clade were sampled later, August 6&#x02013;28. Hence, it is unlikely that the currently available global genomic dataset contains the source of this outbreak.</p></sec><sec sec-type="discussion"><title>Discussion</title><p>Genomic epidemiologic analysis of the possible origins of the COVID-19 re-emergence in New Zealand in August 2020 was inconclusive, probably because of missing genomic data within the quarantine border facilities and in the global dataset. A glimpse into the genomic diversity probably omitted from the global dataset can be seen in the genomes sequenced in New Zealand from SARS-CoV-2&#x02013;positive quarantined case-patients, comprising citizens and residents returning from across the globe. For example, 12 SARS-CoV-2 genomes from persons returning to New Zealand from India who arrived on the same flight fell across at least 4 genomic lineages and comprised sequence divergence of up to 34 single-nucleotide polymorphisms (<ext-link ext-link-type="uri" xlink:href="https://www.nextstrain.org">https://www.nextstrain.org</ext-link>). This divergence represented far more genomic mutations than was observed in New Zealand during the first outbreak in March&#x02013;May 2020 (<xref rid="R7" ref-type="bibr"><italic>7</italic></xref>). Such a high level of diversity in just a small sample of SARS-CoV-2&#x02013;positive case-patients from India suggests that the currently available genomic data fail to encompass the true diversity that existed locally, let alone globally.</p><p>The genome sequences identified after the re-emergence of SARS-CoV-2 in New Zealand in August 2020 exemplified one of the most complete genomic datasets for a specific outbreak compiled to date, comprising 78% of positive case-patients (140 of 179 total case-patients SARS-CoV-2 positive by PCR). Real-time genomic sequencing quickly informed track-and-trace efforts to control the outbreak, setting New Zealand on track to eliminate the virus from the community for the second time. The rapid genome sequencing of positive samples provided confidence to public health teams regarding links to the outbreak and identified that cases and subclusters were linked to a single genomic lineage, resulting from a single introduction event. Indeed, the timing and length of lockdown measures were partly informed on the basis of these data. Overall, real-time viral genomics has played a pivotal role in eliminating COVID-19 from New Zealand and has since helped prevent additional regional lockdowns, leading to substantial economic savings.</p><p>Nevertheless, the biased nature of global sampling, including the contribution of very few genome sequences from certain geographic locations, clearly limited the power of genomics to attribute the geographic origin of the August 2020 outbreak in New Zealand. We therefore advocate that potential sampling biases and gaps in available genomic data be carefully considered whenever attempting to determine the geographic origins of a specific SARS-CoV-2 outbreak. Analyses should consider all available evidence, including that from genomic and epidemiologic sources.</p></sec><sec sec-type="supplementary-material"><title/><supplementary-material content-type="local-data" id="SD1"><caption><title>Appendix 1</title><p>List of genomes obtained from GISAID used in analysis of severe acute respiratory syndrome coronavirus 2.</p></caption><media mimetype="application" mime-subtype="excel" xlink:href="20-4579-Techapp-s1.xlsx" xlink:type="simple" id="d39e475" position="anchor"/></supplementary-material><supplementary-material content-type="local-data" id="SD2"><caption><title>Appendix 2</title><p>Phylogenetic tree of severe acute respiratory syndrome coronavirus 2 genomes.</p></caption><media mimetype="application" mime-subtype="pdf" xlink:href="20-4579-Techapp-s2.pdf" xlink:type="simple" id="d39e482" position="anchor"/></supplementary-material></sec></body><back><fn-group><fn fn-type="citation"><p><italic>Suggested citation for this article</italic>: Geoghegan JL, Douglas J, Ren X, Storey M, Hadfield J, Silander OK, et al. Use of genomics to track coronavirus disease outbreaks, New Zealand. Emerg Infect Dis. 2021 May [<italic>date cited</italic>]. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3201/eid2705.204579">https://doi.org/10.3201/eid2705.204579</ext-link></p></fn><fn id="FN1"><label>1</label><p>These authors contributed equally to this article.</p></fn></fn-group><ack><p>This article was preprinted at <ext-link ext-link-type="uri" xlink:href="https://www.medrxiv.org/content/10.1101/2020.10.28.20221853v1">https://www.medrxiv.org/content/10.1101/2020.10.28.20221853v1</ext-link>.</p></ack><ack><title>Acknowledgments</title><p>We thank the ARTIC network for making their protocols and tools openly available and specifically Josh Quick for sending the initial V1 and V3 amplification primers. We thank the diagnostic laboratories that performed the initial rRT-PCRs and referred samples for sequencing as well as the public health units for providing epidemiologic data. We thank Genomics Aotearoa for their support, the NextStrain team for their support and timely global and local analysis, and all those who have contributed SARS-CoV-2 sequences to the GenBank and GISAID databases. We also acknowledge the use of New Zealand eScience Infrastructure (NeSI) high-performance computing facilities.</p><p>This work was funded by the Ministry of Health of New Zealand, New Zealand Ministry of Business, Innovation and Employment COVID-19 Innovation Acceleration Fund (CIAF-0470), ESR Strategic Innovation Fund, and the New Zealand Health Research Council (20/1018 and 20/1041). New Zealand's national facilities are provided by NeSI and funded jointly by NeSI&#x02019;s collaborator institutions and through the Ministry of Business, Innovation and Employment's Research Infrastructure program.</p></ack><bio id="d39e513"><p>Dr. Geoghegan is an evolutionary virologist at the University of Otago, Dunedin, New Zealand, and the Institute of Environmental Science and Research, Wellington, New Zealand. Her research focus is understanding how viruses emerge and spread in new populations.</p></bio><ref-list><title>References</title><ref id="R1"><label>1. </label><mixed-citation publication-type="webpage"><string-name><surname>Holmes</surname>
<given-names>EC</given-names></string-name>. Novel <year>2019</year> coronavirus genome [<comment>cited 2021 Jan 20</comment>]. <ext-link ext-link-type="uri" xlink:href="https://virological.org/t/novel-2019-coronavirus-genome/319">https://virological.org/t/novel-2019-coronavirus-genome/319</ext-link></mixed-citation></ref><ref id="R2"><label>2. </label><mixed-citation publication-type="journal"><string-name><surname>Shin</surname>
<given-names>MD</given-names></string-name>, <string-name><surname>Shukla</surname>
<given-names>S</given-names></string-name>, <string-name><surname>Chung</surname>
<given-names>YH</given-names></string-name>, <string-name><surname>Beiss</surname>
<given-names>V</given-names></string-name>, <string-name><surname>Chan</surname>
<given-names>SK</given-names></string-name>, <string-name><surname>Ortega-Rivera</surname>
<given-names>OA</given-names></string-name>, <etal>et al.</etal>
<article-title>COVID-19 vaccine development and a potential nanomaterial path forward.</article-title>
<source>Nat Nanotechnol</source>. <year>2020</year>;<volume>15</volume>:<fpage>646</fpage>&#x02013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1038/s41565-020-0737-y</pub-id><pub-id pub-id-type="pmid">32669664</pub-id></mixed-citation></ref><ref id="R3"><label>3. </label><mixed-citation publication-type="journal"><string-name><surname>Stebbing</surname>
<given-names>J</given-names></string-name>, <string-name><surname>Phelan</surname>
<given-names>A</given-names></string-name>, <string-name><surname>Griffin</surname>
<given-names>I</given-names></string-name>, <string-name><surname>Tucker</surname>
<given-names>C</given-names></string-name>, <string-name><surname>Oechsle</surname>
<given-names>O</given-names></string-name>, <string-name><surname>Smith</surname>
<given-names>D</given-names></string-name>, <etal>et al.</etal>
<article-title>COVID-19: combining antiviral and anti-inflammatory treatments.</article-title>
<source>Lancet Infect Dis</source>. <year>2020</year>;<volume>20</volume>:<fpage>400</fpage>&#x02013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30132-8</pub-id><pub-id pub-id-type="pmid">32113509</pub-id></mixed-citation></ref><ref id="R4"><label>4. </label><mixed-citation publication-type="journal"><string-name><surname>Elbe</surname>
<given-names>S</given-names></string-name>, <string-name><surname>Buckland-Merrett</surname>
<given-names>G</given-names></string-name>. <article-title>Data, disease and diplomacy: GISAID&#x02019;s innovative contribution to global health.</article-title>
<source>Glob Chall</source>. <year>2017</year>;<volume>1</volume>:<fpage>33</fpage>&#x02013;<lpage>46</lpage>. <pub-id pub-id-type="doi">10.1002/gch2.1018</pub-id><pub-id pub-id-type="pmid">31565258</pub-id></mixed-citation></ref><ref id="R5"><label>5. </label><mixed-citation publication-type="journal"><string-name><surname>Hadfield</surname>
<given-names>J</given-names></string-name>, <string-name><surname>Megill</surname>
<given-names>C</given-names></string-name>, <string-name><surname>Bell</surname>
<given-names>SM</given-names></string-name>, <string-name><surname>Huddleston</surname>
<given-names>J</given-names></string-name>, <string-name><surname>Potter</surname>
<given-names>B</given-names></string-name>, <string-name><surname>Callender</surname>
<given-names>C</given-names></string-name>, <etal>et al.</etal>
<article-title>Nextstrain: real-time tracking of pathogen evolution.</article-title>
<source>Bioinformatics</source>. <year>2018</year>;<volume>34</volume>:<fpage>4121</fpage>&#x02013;<lpage>3</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty407</pub-id><pub-id pub-id-type="pmid">29790939</pub-id></mixed-citation></ref><ref id="R6"><label>6. </label><mixed-citation publication-type="journal"><string-name><surname>Bedford</surname>
<given-names>T</given-names></string-name>, <string-name><surname>Greninger</surname>
<given-names>AL</given-names></string-name>, <string-name><surname>Roychoudhury</surname>
<given-names>P</given-names></string-name>, <string-name><surname>Starita</surname>
<given-names>LM</given-names></string-name>, <string-name><surname>Famulare</surname>
<given-names>M</given-names></string-name>, <string-name><surname>Huang</surname>
<given-names>M-L</given-names></string-name>, <etal>et al.</etal>; <collab>Seattle Flu Study Investigators</collab>. <article-title>Cryptic transmission of SARS-CoV-2 in Washington state.</article-title>
<source>Science</source>. <year>2020</year>;<volume>370</volume>:<fpage>571</fpage>&#x02013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1126/science.abc0523</pub-id><pub-id pub-id-type="pmid">32913002</pub-id></mixed-citation></ref><ref id="R7"><label>7. </label><mixed-citation publication-type="journal"><string-name><surname>Geoghegan</surname>
<given-names>JL</given-names></string-name>, <string-name><surname>Ren</surname>
<given-names>X</given-names></string-name>, <string-name><surname>Storey</surname>
<given-names>M</given-names></string-name>, <string-name><surname>Hadfield</surname>
<given-names>J</given-names></string-name>, <string-name><surname>Jelley</surname>
<given-names>L</given-names></string-name>, <string-name><surname>Jefferies</surname>
<given-names>S</given-names></string-name>, <etal>et al.</etal>
<article-title>Genomic epidemiology reveals transmission patterns and dynamics of SARS-CoV-2 in Aotearoa New Zealand.</article-title>
<source>Nat Commun</source>. <year>2020</year>;<volume>11</volume>:<fpage>6351</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-20235-8</pub-id><pub-id pub-id-type="pmid">33311501</pub-id></mixed-citation></ref><ref id="R8"><label>8. </label><mixed-citation publication-type="journal"><string-name><surname>Candido</surname>
<given-names>DS</given-names></string-name>, <string-name><surname>Claro</surname>
<given-names>IM</given-names></string-name>, <string-name><surname>de Jesus</surname>
<given-names>JG</given-names></string-name>, <string-name><surname>Souza</surname>
<given-names>WM</given-names></string-name>, <string-name><surname>Moreira</surname>
<given-names>FRR</given-names></string-name>, <string-name><surname>Dellicour</surname>
<given-names>S</given-names></string-name>, <etal>et al.</etal>; <collab>Brazil-UK Centre for Arbovirus Discovery, Diagnosis, Genomics and Epidemiology (CADDE) Genomic Network</collab>. <article-title>Evolution and epidemic spread of SARS-CoV-2 in Brazil.</article-title>
<source>Science</source>. <year>2020</year>;<volume>369</volume>:<fpage>1255</fpage>&#x02013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.1126/science.abd2161</pub-id><pub-id pub-id-type="pmid">32703910</pub-id></mixed-citation></ref><ref id="R9"><label>9. </label><mixed-citation publication-type="journal"><string-name><surname>Eden</surname>
<given-names>J-S</given-names></string-name>, <string-name><surname>Rockett</surname>
<given-names>R</given-names></string-name>, <string-name><surname>Carter</surname>
<given-names>I</given-names></string-name>, <string-name><surname>Rahman</surname>
<given-names>H</given-names></string-name>, <string-name><surname>de Ligt</surname>
<given-names>J</given-names></string-name>, <string-name><surname>Hadfield</surname>
<given-names>J</given-names></string-name>, <etal>et al.</etal>
<article-title>2019-nCoV Study Group. An emergent clade of SARS-CoV-2 linked to returned travellers from Iran.</article-title>
<source>Virus Evol</source>. <year>2020</year>;<volume>6</volume>:<fpage>a027</fpage>. <pub-id pub-id-type="doi">10.1093/ve/veaa027</pub-id></mixed-citation></ref><ref id="R10"><label>10. </label><mixed-citation publication-type="journal"><string-name><surname>Dong</surname>
<given-names>E</given-names></string-name>, <string-name><surname>Du</surname>
<given-names>H</given-names></string-name>, <string-name><surname>Gardner</surname>
<given-names>L</given-names></string-name>. <article-title>An interactive web-based dashboard to track COVID-19 in real time.</article-title>
<source>Lancet Infect Dis</source>. <year>2020</year>;<volume>20</volume>:<fpage>533</fpage>&#x02013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30120-1</pub-id><pub-id pub-id-type="pmid">32087114</pub-id></mixed-citation></ref><ref id="R11"><label>11. </label><mixed-citation publication-type="journal"><string-name><surname>Oude Munnink</surname>
<given-names>BB</given-names></string-name>, <string-name><surname>Nieuwenhuijse</surname>
<given-names>DF</given-names></string-name>, <string-name><surname>Stein</surname>
<given-names>M</given-names></string-name>, <string-name><surname>O&#x02019;Toole</surname>
<given-names>&#x000c1;</given-names></string-name>, <string-name><surname>Haverkate</surname>
<given-names>M</given-names></string-name>, <string-name><surname>Mollers</surname>
<given-names>M</given-names></string-name>, <etal>et al.</etal>; <collab>Dutch-Covid-19 response team</collab>. <article-title>Rapid SARS-CoV-2 whole-genome sequencing and analysis for informed public health decision-making in the Netherlands.</article-title>
<source>Nat Med</source>. <year>2020</year>;<volume>26</volume>:<fpage>1405</fpage>&#x02013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-020-0997-y</pub-id><pub-id pub-id-type="pmid">32678356</pub-id></mixed-citation></ref><ref id="R12"><label>12. </label><mixed-citation publication-type="journal"><string-name><surname>Kalinich</surname>
<given-names>CC</given-names></string-name>, <string-name><surname>Jensen</surname>
<given-names>CG</given-names></string-name>, <string-name><surname>Neugebauer</surname>
<given-names>P</given-names></string-name>, <string-name><surname>Petrone</surname>
<given-names>ME</given-names></string-name>, <string-name><surname>Pe&#x000f1;a-Hern&#x000e1;ndez</surname>
<given-names>M</given-names></string-name>, <string-name><surname>Ott</surname>
<given-names>IM</given-names></string-name>, <etal>et al.</etal>
<article-title>Real-time public health communication of local SARS-CoV-2 genomic epidemiology.</article-title>
<source>PLoS Biol</source>. <year>2020</year>;<volume>18</volume>:<elocation-id>e3000869</elocation-id>. <pub-id pub-id-type="doi">10.1371/journal.pbio.3000869</pub-id><pub-id pub-id-type="pmid">32822393</pub-id></mixed-citation></ref><ref id="R13"><label>13. </label><mixed-citation publication-type="journal"><string-name><surname>Rockett</surname>
<given-names>RJ</given-names></string-name>, <string-name><surname>Arnott</surname>
<given-names>A</given-names></string-name>, <string-name><surname>Lam</surname>
<given-names>C</given-names></string-name>, <string-name><surname>Sadsad</surname>
<given-names>R</given-names></string-name>, <string-name><surname>Timms</surname>
<given-names>V</given-names></string-name>, <string-name><surname>Gray</surname>
<given-names>K-A</given-names></string-name>, <etal>et al.</etal>
<article-title>Revealing COVID-19 transmission in Australia by SARS-CoV-2 genome sequencing and agent-based modeling.</article-title>
<source>Nat Med</source>. <year>2020</year>;<volume>26</volume>:<fpage>1398</fpage>&#x02013;<lpage>404</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-020-1000-7</pub-id><pub-id pub-id-type="pmid">32647358</pub-id></mixed-citation></ref><ref id="R14"><label>14. </label><mixed-citation publication-type="journal"><string-name><surname>Bauer</surname>
<given-names>DC</given-names></string-name>, <string-name><surname>Tay</surname>
<given-names>AP</given-names></string-name>, <string-name><surname>Wilson</surname>
<given-names>LOW</given-names></string-name>, <string-name><surname>Reti</surname>
<given-names>D</given-names></string-name>, <string-name><surname>Hosking</surname>
<given-names>C</given-names></string-name>, <string-name><surname>McAuley</surname>
<given-names>AJ</given-names></string-name>, <etal>et al.</etal>
<article-title>Supporting pandemic response using genomics and bioinformatics: A case study on the emergent SARS-CoV-2 outbreak.</article-title>
<source>Transbound Emerg Dis</source>. <year>2020</year>;<volume>67</volume>:<fpage>1453</fpage>&#x02013;<lpage>62</lpage>. <pub-id pub-id-type="doi">10.1111/tbed.13588</pub-id><pub-id pub-id-type="pmid">32306500</pub-id></mixed-citation></ref><ref id="R15"><label>15. </label><mixed-citation publication-type="journal"><string-name><surname>Jefferies</surname>
<given-names>S</given-names></string-name>, <string-name><surname>French</surname>
<given-names>N</given-names></string-name>, <string-name><surname>Gilkison</surname>
<given-names>C</given-names></string-name>, <string-name><surname>Graham</surname>
<given-names>G</given-names></string-name>, <string-name><surname>Hope</surname>
<given-names>V</given-names></string-name>, <string-name><surname>Marshall</surname>
<given-names>J</given-names></string-name>, <etal>et al.</etal>
<article-title>COVID-19 in New Zealand and the impact of the national response: a descriptive epidemiological study.</article-title>
<source>Lancet Public Health</source>. <year>2020</year>;<volume>5</volume>:<fpage>e612</fpage>&#x02013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1016/S2468-2667(20)30225-5</pub-id><pub-id pub-id-type="pmid">33065023</pub-id></mixed-citation></ref><ref id="R16"><label>16. </label><mixed-citation publication-type="journal"><string-name><surname>Freed</surname>
<given-names>NE</given-names></string-name>, <string-name><surname>Vlkov&#x000e1;</surname>
<given-names>M</given-names></string-name>, <string-name><surname>Faisal</surname>
<given-names>MB</given-names></string-name>, <string-name><surname>Silander</surname>
<given-names>OK</given-names></string-name>. <article-title>Rapid and inexpensive whole-genome sequencing of SARS-CoV-2 using 1200&#x02009;bp tiled amplicons and Oxford Nanopore Rapid Barcoding.</article-title>
<source>Biol Methods Protoc</source>. <year>2020</year>;<volume>5</volume>:<fpage>a014</fpage>. <pub-id pub-id-type="doi">10.1093/biomethods/bpaa014</pub-id><pub-id pub-id-type="pmid">33029559</pub-id></mixed-citation></ref><ref id="R17"><label>17. </label><mixed-citation publication-type="journal"><string-name><surname>Rambaut</surname>
<given-names>A</given-names></string-name>, <string-name><surname>Holmes</surname>
<given-names>EC</given-names></string-name>, <string-name><surname>O&#x02019;Toole</surname>
<given-names>&#x000c1;</given-names></string-name>, <string-name><surname>Hill</surname>
<given-names>V</given-names></string-name>, <string-name><surname>McCrone</surname>
<given-names>JT</given-names></string-name>, <string-name><surname>Ruis</surname>
<given-names>C</given-names></string-name>, <etal>et al.</etal>
<article-title>A dynamic nomenclature proposal for SARS-CoV-2 lineages to assist genomic epidemiology.</article-title>
<source>Nat Microbiol</source>. <year>2020</year>;<volume>5</volume>:<fpage>1403</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1038/s41564-020-0770-5</pub-id><pub-id pub-id-type="pmid">32669681</pub-id></mixed-citation></ref><ref id="R18"><label>18. </label><mixed-citation publication-type="journal"><string-name><surname>Katoh</surname>
<given-names>K</given-names></string-name>, <string-name><surname>Standley</surname>
<given-names>DM</given-names></string-name>. <article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability.</article-title>
<source>Mol Biol Evol</source>. <year>2013</year>;<volume>30</volume>:<fpage>772</fpage>&#x02013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id><pub-id pub-id-type="pmid">23329690</pub-id></mixed-citation></ref><ref id="R19"><label>19. </label><mixed-citation publication-type="journal"><string-name><surname>Bouckaert</surname>
<given-names>R</given-names></string-name>, <string-name><surname>Vaughan</surname>
<given-names>TG</given-names></string-name>, <string-name><surname>Barido-Sottani</surname>
<given-names>J</given-names></string-name>, <string-name><surname>Duch&#x000ea;ne</surname>
<given-names>S</given-names></string-name>, <string-name><surname>Fourment</surname>
<given-names>M</given-names></string-name>, <string-name><surname>Gavryushkina</surname>
<given-names>A</given-names></string-name>, <etal>et al.</etal>
<article-title>BEAST 2.5: An advanced software platform for Bayesian evolutionary analysis.</article-title>
<source>PLOS Comput Biol</source>. <year>2019</year>;<volume>15</volume>:<elocation-id>e1006650</elocation-id>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1006650</pub-id><pub-id pub-id-type="pmid">30958812</pub-id></mixed-citation></ref><ref id="R20"><label>20. </label><mixed-citation publication-type="journal"><string-name><surname>Drummond</surname>
<given-names>AJ</given-names></string-name>, <string-name><surname>Rambaut</surname>
<given-names>A</given-names></string-name>, <string-name><surname>Shapiro</surname>
<given-names>B</given-names></string-name>, <string-name><surname>Pybus</surname>
<given-names>OG</given-names></string-name>. <article-title>Bayesian coalescent inference of past population dynamics from molecular sequences.</article-title>
<source>Mol Biol Evol</source>. <year>2005</year>;<volume>22</volume>:<fpage>1185</fpage>&#x02013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msi103</pub-id><pub-id pub-id-type="pmid">15703244</pub-id></mixed-citation></ref><ref id="R21"><label>21. </label><mixed-citation publication-type="journal"><string-name><surname>Letunic</surname>
<given-names>I</given-names></string-name>, <string-name><surname>Bork</surname>
<given-names>P</given-names></string-name>. <article-title>Interactive Tree Of Life (iTOL) v4: recent updates and new developments.</article-title>
<source>Nucleic Acids Res</source>. <year>2019</year>;<volume>47</volume>(<issue>W1</issue>):<fpage>W256</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz239</pub-id><pub-id pub-id-type="pmid">30931475</pub-id></mixed-citation></ref></ref-list></back></article>