<!DOCTYPE article
PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD with MathML3 v1.3 20210610//EN" "JATS-archivearticle1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="1.3" xml:lang="en" article-type="research-article"><?properties manuscript?><processing-meta base-tagset="archiving" mathml-version="3.0" table-model="xhtml" tagset-family="jats"><restricted-by>pmc</restricted-by></processing-meta><front><journal-meta><journal-id journal-id-type="nlm-journal-id">9107782</journal-id><journal-id journal-id-type="pubmed-jr-id">8548</journal-id><journal-id journal-id-type="nlm-ta">Curr Biol</journal-id><journal-id journal-id-type="iso-abbrev">Curr Biol</journal-id><journal-title-group><journal-title>Current biology : CB</journal-title></journal-title-group><issn pub-type="ppub">0960-9822</issn><issn pub-type="epub">1879-0445</issn></journal-meta><article-meta><article-id pub-id-type="pmid">37295427</article-id><article-id pub-id-type="pmc">10316540</article-id><article-id pub-id-type="doi">10.1016/j.cub.2023.05.047</article-id><article-id pub-id-type="manuscript">NIHMS1907424</article-id><article-categories><subj-group subj-group-type="heading"><subject>Article</subject></subj-group></article-categories><title-group><article-title>Dynamics of Eastern equine encephalitis virus during the 2019 outbreak in the Northeast United States</article-title></title-group><contrib-group><contrib contrib-type="author"><name><surname>Hill</surname><given-names>Verity</given-names></name><xref rid="A1" ref-type="aff">1</xref><xref rid="FN1" ref-type="author-notes">*</xref><xref rid="CR1" ref-type="corresp">@</xref></contrib><contrib contrib-type="author"><name><surname>Koch</surname><given-names>Robert T.</given-names></name><xref rid="A1" ref-type="aff">1</xref><xref rid="FN1" ref-type="author-notes">*</xref></contrib><contrib contrib-type="author"><name><surname>Bialosuknia</surname><given-names>Sean M.</given-names></name><xref rid="A2" ref-type="aff">2</xref></contrib><contrib contrib-type="author"><name><surname>Ngo</surname><given-names>Kiet</given-names></name><xref rid="A2" ref-type="aff">2</xref></contrib><contrib contrib-type="author"><name><surname>Zink</surname><given-names>Steven D.</given-names></name><xref rid="A2" ref-type="aff">2</xref></contrib><contrib contrib-type="author"><name><surname>Koetzner</surname><given-names>Cheri A.</given-names></name><xref rid="A2" ref-type="aff">2</xref></contrib><contrib contrib-type="author"><name><surname>Maffei</surname><given-names>Joseph G.</given-names></name><xref rid="A2" ref-type="aff">2</xref></contrib><contrib contrib-type="author"><name><surname>Dupuis</surname><given-names>Alan P.</given-names></name><xref rid="A2" ref-type="aff">2</xref></contrib><contrib contrib-type="author"><name><surname>Backenson</surname><given-names>P. Bryon</given-names></name><xref rid="A3" ref-type="aff">3</xref></contrib><contrib contrib-type="author"><name><surname>Oliver</surname><given-names>JoAnne</given-names></name><xref rid="A4" ref-type="aff">4</xref><xref rid="A5" ref-type="aff">5</xref></contrib><contrib contrib-type="author"><name><surname>Bransfield</surname><given-names>Angela B.</given-names></name><xref rid="A6" ref-type="aff">6</xref></contrib><contrib contrib-type="author"><name><surname>Misencik</surname><given-names>Michael J.</given-names></name><xref rid="A6" ref-type="aff">6</xref></contrib><contrib contrib-type="author"><name><surname>Petruff</surname><given-names>Tanya A.</given-names></name><xref rid="A6" ref-type="aff">6</xref></contrib><contrib contrib-type="author"><name><surname>Shepard</surname><given-names>John J.</given-names></name><xref rid="A6" ref-type="aff">6</xref></contrib><contrib contrib-type="author"><name><surname>Warren</surname><given-names>Joshua L.</given-names></name><xref rid="A7" ref-type="aff">7</xref><xref rid="A8" ref-type="aff">8</xref></contrib><contrib contrib-type="author"><name><surname>Gill</surname><given-names>Mandev S.</given-names></name><xref rid="A9" ref-type="aff">9</xref></contrib><contrib contrib-type="author"><name><surname>Baele</surname><given-names>Guy</given-names></name><xref rid="A10" ref-type="aff">10</xref></contrib><contrib contrib-type="author"><name><surname>Vogels</surname><given-names>Chantal B.F.</given-names></name><xref rid="A1" ref-type="aff">1</xref></contrib><contrib contrib-type="author"><name><surname>Gallagher</surname><given-names>Glen</given-names></name><xref rid="A11" ref-type="aff">11</xref><xref rid="A12" ref-type="aff">12</xref></contrib><contrib contrib-type="author"><name><surname>Burns</surname><given-names>Paul</given-names></name><xref rid="A11" ref-type="aff">11</xref></contrib><contrib contrib-type="author"><name><surname>Hentoff</surname><given-names>Aaron</given-names></name><xref rid="A11" ref-type="aff">11</xref></contrib><contrib contrib-type="author"><name><surname>Smole</surname><given-names>Sandra</given-names></name><xref rid="A11" ref-type="aff">11</xref></contrib><contrib contrib-type="author"><name><surname>Brown</surname><given-names>Catherine</given-names></name><xref rid="A11" ref-type="aff">11</xref></contrib><contrib contrib-type="author"><name><surname>Osborne</surname><given-names>Matthew</given-names></name><xref rid="A11" ref-type="aff">11</xref></contrib><contrib contrib-type="author"><name><surname>Kramer</surname><given-names>Laura D.</given-names></name><xref rid="A2" ref-type="aff">2</xref><xref rid="A13" ref-type="aff">13</xref></contrib><contrib contrib-type="author"><name><surname>Armstrong</surname><given-names>Philip M.</given-names></name><xref rid="A1" ref-type="aff">1</xref><xref rid="A5" ref-type="aff">5</xref><xref rid="FN2" ref-type="author-notes">#</xref><xref rid="CR1" ref-type="corresp">@</xref></contrib><contrib contrib-type="author"><name><surname>Ciota</surname><given-names>Alexander T.</given-names></name><xref rid="A2" ref-type="aff">2</xref><xref rid="A13" ref-type="aff">13</xref><xref rid="FN2" ref-type="author-notes">#</xref><xref rid="CR1" ref-type="corresp">@</xref></contrib><contrib contrib-type="author"><name><surname>Grubaugh</surname><given-names>Nathan D.</given-names></name><xref rid="A1" ref-type="aff">1</xref><xref rid="A7" ref-type="aff">7</xref><xref rid="A14" ref-type="aff">14</xref><xref rid="FN2" ref-type="author-notes">#</xref><xref rid="CR1" ref-type="corresp">@</xref><xref rid="CR2" ref-type="corresp">!</xref></contrib></contrib-group><aff id="A1"><label>1</label>Department of Epidemiology of Microbial Diseases, Yale School of Public Health, New Haven, CT, USA, 06510</aff><aff id="A2"><label>2</label>The Arbovirus Laboratory, New York State Department of Health, Wadsworth Center, Slingerlands, NY, USA, 12159</aff><aff id="A3"><label>3</label>New York State Department of Health, Bureau of Communicable Disease Control, Albany, NY, USA, 12237</aff><aff id="A4"><label>4</label>New York State Department of Health, Bureau of Communicable Disease Control, Syracuse, NY, USA, 13202</aff><aff id="A5"><label>5</label>Division of Environmental and Renewable Resources, State University of New York at Morrisville - School of Agriculture, Business and Technology, Morrisville, NY, USA, 13408</aff><aff id="A6"><label>6</label>Center for Vector Biology and Zoonotic Diseases, Department of Entomology, The Connecticut Agricultural Experiment Station, New Haven, CT, USA, 06511</aff><aff id="A7"><label>7</label>Department of Biostatistics, Yale School of Public Health, New Haven, CT, USA, 06510</aff><aff id="A8"><label>8</label>Public Health Modeling Unit, Yale School of Public Health, New Haven, CT, USA, 06510</aff><aff id="A9"><label>9</label>Department of Statistics, University of Georgia, Athens, GA, USA, 30602</aff><aff id="A10"><label>10</label>Department of Microbiology, Immunology and Transplantation, Rega Institute, KU Leuven, Leuven, Belgium, BE-3000</aff><aff id="A11"><label>11</label>Massachusetts Department of Public Health, Boston, MA, USA, 02108</aff><aff id="A12"><label>12</label>Rhode Island State Health Laboratory, Rhode Island Department of Health, Providence, RI, USA, 02904</aff><aff id="A13"><label>13</label>Department of Biomedical Sciences, State University of New York at Albany School of Public Health, Albany, NY, USA, 12237</aff><aff id="A14"><label>14</label>Department of Ecology and Evolutionary Biology, Yale University, New Haven, CT, USA</aff><author-notes><fn id="FN1"><label>*</label><p id="P1">Co-first authors</p></fn><fn id="FN2"><label>#</label><p id="P2">Co-senior authors</p></fn><fn fn-type="con" id="FN3"><p id="P3">Author contributions</p><p id="P4">V.H., R.T.K., P.M.A, A.T.C, and N.D.G conceptualized the study. V.H., R.T.K., J.L.W., M.S.G, G.B., N.D.G., Development or design of methodology; creation of models. M.S.G, G.B. Programming, software development; designing computer programs; implementation of the computer code and supporting algorithms; testing of existing code components. V.H., R.T.K., Formal analysis. S.M.B., K.N, S.D.Z, C.A.K, J.G.M, A.P.D, P.B.B, J.O., A.B.B, M.J.M., T.A.P., J.J.S, G.G., P.B., A.H., S.S., C.B., M.O., L.D.K., P.M.A., A.T.C Provision of study materials, reagents, materials, patients, laboratory samples, animals, instrumentation, computing resources, or other analysis tools. V.H., R.T.K., S.M.B, J.O., J.J.S., A.T.C., P.M.A Data Curation. V.H., R.T.K., S.M.B. N.D.G., C.F.V., A.T.C., P.M.A Writing &#x02013; original draft. All authors contributed to review and editing of the manuscript. V.H. and R.T.K. Visualization. G.G., P.M.A., A.T.C., N.D.G Supervision</p></fn><corresp id="CR1"><label>@</label>Co-corresponding authors: VH (<email>verity.hill@yale.edu</email>), PMA (<email>Philip.Armstrong@ct.gov</email>), ATC (<email>alexander.ciota@health.ny.gov</email>), NDG (<email>nathan.grubaugh@yale.edu</email>)</corresp><corresp id="CR2"><label>!</label>Lead contact (<email>verity.hill@yale.edu</email>)</corresp></author-notes><pub-date pub-type="nihms-submitted"><day>22</day><month>6</month><year>2023</year></pub-date><pub-date pub-type="ppub"><day>19</day><month>6</month><year>2023</year></pub-date><pub-date pub-type="epub"><day>08</day><month>6</month><year>2023</year></pub-date><pub-date pub-type="pmc-release"><day>19</day><month>6</month><year>2024</year></pub-date><volume>33</volume><issue>12</issue><fpage>2515</fpage><lpage>2527.e6</lpage><abstract id="ABS1"><title>Summary</title><p id="P5">Eastern equine encephalitis virus (EEEV) causes a rare but severe disease in horses and humans, and is maintained in an enzootic transmission cycle between songbirds and <italic toggle="yes">Culiseta melanura</italic> mosquitoes. In 2019, the largest EEEV outbreak in the United States for more than 50 years occurred, centered in the Northeast. To explore the dynamics of the outbreak, we sequenced 80 isolates of EEEV and combined them with existing genomic data. We found that, like previous years, cases were driven by multiple independent but short-lived virus introductions into the Northeast from Florida. Once in the Northeast, we found that Massachusetts was important for regional spread. We found no evidence of any changes in viral, human, or bird factors which would explain the increase in cases in 2019, although the ecology of EEEV is complex and further data is required to explore these in more detail. By using detailed mosquito surveillance data collected by Massachusetts and Connecticut, however, we found that the abundance of <italic toggle="yes">Cs. melanura</italic> was exceptionally high in 2019, as was the EEEV infection rate. We employed these mosquito data to build a negative binomial regression model and applied it to estimate early season risks of human or horse cases. We found that the month of first detection of EEEV in mosquito surveillance data and vector index (abundance multiplied by infection rate) were predictive of cases later in the season. We therefore highlight the importance of mosquito surveillance programs as an integral part of public health and disease control.</p></abstract><abstract id="ABS2" abstract-type="summary"><title>Blurb:</title><p id="P6">Hill <italic toggle="yes">et al.</italic> investigate the drivers behind outbreaks of Eastern Equine Encephalitis Virus in the northeast US, including a large one in 2019. Using virus genome sequencing and mosquito surveillance data, they show it was caused by several small virus introductions from Florida and could be predicted by mosquito abundance and infection rates.</p></abstract></article-meta></front><body><sec id="S1"><title>Introduction</title><p id="P7">Eastern equine encephalitis virus (EEEV) is a mosquito-borne virus that has caused periodic outbreaks in humans, horses, and other agricultural animals in the United States (US) since its discovery in 1933<sup><xref rid="R1" ref-type="bibr">1</xref>,<xref rid="R2" ref-type="bibr">2</xref></sup>. The virus circulates in a bird-mosquito transmission cycle while infections of most mammals are considered &#x0201c;dead end hosts&#x0201d;. In humans, EEEV can cause severe disease, with an apparent case fatality rate of 30% and long-term neurological sequelae in more than half of those who survive<sup><xref rid="R3" ref-type="bibr">3</xref></sup>. Still, diagnosed human cases are rare, with an average of 7 per year in the US. The largest human outbreak in more than 50 years was in 2019, with 38 cases and 12 deaths<sup><xref rid="R4" ref-type="bibr">4</xref></sup>. The outbreak was not limited to the East Coast where cases are typically detected, as 10 of the human cases that year were reported from Michigan. The widespread EEEV cases in 2019 had significant impacts on the communities: many evening outdoor events were canceled to avoid mosquito exposure and aerial insecticide applications were the subject of public controversy<sup><xref rid="R5" ref-type="bibr">5</xref>,<xref rid="R6" ref-type="bibr">6</xref></sup>. Thus, understanding the drivers of EEEV outbreaks and how to accurately communicate risk to the public is of high importance<sup><xref rid="R7" ref-type="bibr">7</xref></sup>.</p><p id="P8">The key unanswered questions are (1) what factors facilitated the unprecedented EEEV activity in 2019, and (2) can we accurately estimate risk of human and horse infections? These are challenging questions to answer because the ecology of EEEV is complex, involving multiple species of bird and mosquito. <italic toggle="yes">Culiseta melanura</italic> serves as the main mosquito vector of EEEV in North America, lives in freshwater swamp habitats, and feeds primarily on passerine birds<sup><xref rid="R8" ref-type="bibr">8</xref></sup>. Historically, <italic toggle="yes">Coquillettidia perturbans</italic> was implicated in the spillover process to humans as bridge vectors (i.e., vectors which feed on both birds and mammals)<sup><xref rid="R9" ref-type="bibr">9</xref></sup>. This strict delineation between obligate avian and permissive feeders, however, is not absolute, and <italic toggle="yes">Cs. melanura</italic> has also been found to occasionally feed on mammals in the Northeast<sup><xref rid="R10" ref-type="bibr">10</xref></sup>. In terms of viral dynamics, previous work demonstrated that EEEV circulates year round in Florida and is introduced into the Northeast through seasonal bird migration<sup><xref rid="R11" ref-type="bibr">11</xref>,<xref rid="R12" ref-type="bibr">12</xref></sup>, although this process does not happen predictably every year. Predicting the annual case dynamics is therefore difficult, having to take into account viral dynamics across multiple species and geographic scales.</p><p id="P9">In this study, we sequenced 80 EEEV isolates and used a combination of phylodynamics, mosquito surveillance, and mathematical and statistical modeling to explore the dynamics of EEEV in the Northeast US. We specifically addressed the factors behind the 2019 outbreak with the aim of understanding if large outbreak years are predictable, or likely to be repeated. We confirmed that the 2019 outbreak was primarily driven by EEEV introductions from Florida rather than extended spread in the region. We also found that when there is regional spread in the Northeast it mostly originates from Massachusetts. We found no evidence of viral, human, or avian factors contributing to the 2019 outbreak, but found that mosquito surveillance data was able to explain much of the variation in human and horse cases, highlighting the importance of high-quality and routinely collected mosquito data.</p></sec><sec id="S2"><title>Results</title><sec id="S3"><title>High EEEV mosquito infections rates within known transmission foci</title><p id="P10">The outbreak of EEEV in humans and horses in 2019 was primarily focused in the Northeast US (see Methods). During 2019 there were 19 human and 26 horse cases reported in the Northeast US, compared to 11 human and 20 horse cases in 2005, the second largest outbreak since surveillance data became publicly available online via ArboNETin 2003 (<xref rid="F1" ref-type="fig">Figure 1A</xref>). The earliest human cases in the region were reported in July in Massachusetts. This is slightly earlier than the earliest Northeastern horse cases, which were reported in August across all Northeastern states other than Vermont (<xref rid="F1" ref-type="fig">Figure 1B</xref>). The last cases were in September in Connecticut and Massachusetts (human) and October in New York (horse).</p><p id="P11">Historically, there have been two foci of transmission in the Northeast: an eastern, coastal focus which encompasses most of Massachusetts and Connecticut, and a western focus in central New York towards Lake Ontario. While cases were recorded in both foci in 2019, the vast majority were in the eastern focus in Massachusetts and Connecticut, with no human cases and only 8 horse cases reported in upstate New York (<xref rid="F1" ref-type="fig">Figure 1C</xref>). Cases primarily occurred in counties which had reported EEEV-positive human, horses, or mosquitoes before 2019. Further, the two counties which had not previously detected EEEV (Cattaraugus and Ontario counties) are adjacent to counties which have (<xref rid="F1" ref-type="fig">Figure 1C</xref>). Therefore, there was not much geographical expansion in 2019, and cases fit into previously established transmission foci (<xref rid="F1" ref-type="fig">Figure 1C</xref>).</p><p id="P12">Using data from routine mosquito surveillance, we calculated the maximum-likelihood estimates (MLEs) of mosquito infection rates (see Methods). We found the number of tested <italic toggle="yes">Cs. melanura</italic> mosquitoes and EEEV infection rates in Massachusetts and Connecticut, two states with high 2019 case counts (<xref rid="F1" ref-type="fig">Figure 1A</xref>), were high in 2019 (<xref rid="F1" ref-type="fig">Figure 1D</xref>). The MLE infection rate in Massachusetts in 2019 was 3.62/1000 vs the 2003&#x02013;2018 average of 1.21/1000 (95% CI: 0.67&#x02013;1.75/1000), and in Connecticut it was 3.67/1000 vs 0.94/1000 (95% CI: 0.36&#x02013;1.52/1000).</p><p id="P13">New York, which reported cases in 2014 (12 horse and 2 human cases), 2015 (3 human cases), and 2018 (3 horse cases), had more of a normal EEEV year in 2019 (8 horse cases). Subsequently, we did not find a high number of tested <italic toggle="yes">Cs. melanura</italic> mosquitoes and EEEV infection rates in New York in 2019 (MLE infection rate 2019 = 3.30/1000; 2003&#x02013;2018 average = 2.49/1000, 95% CI: 1.53&#x02013;3.45/1000). In general, the mosquito infection rate patterns in Massachusetts and Connecticut are more similar to each other compared to New York, which is likely indicative of the two distinct geographical foci of transmission described above.</p></sec><sec id="S4"><title>The 2019 outbreak in the Northeast was caused by several recent virus introductions from Florida</title><p id="P14">To explore the underlying spatial dynamics of EEEV in the US, we performed a phylogeographic reconstruction on a state level to determine the timing and the source of viruses causing the 2019 outbreak. Phylogeographic analysis to reconstruct virus spread requires sequence data from across spatial and temporal scales. While EEEV genomic sequence data before 2003 are relatively sparse, there were some sequences from across the full range of years, with the earliest sequence from the first recorded outbreak in 1933 (<xref rid="F2" ref-type="fig">Figure 2A</xref>). Within the Northeast, EEEV sequencing was most concentrated on samples from southeastern Massachusetts and upstate New York (<xref rid="F2" ref-type="fig">Figure 2B</xref>). Nationally, most sequences were from the Northeast and Florida, although only until 2014 for the latter. There was sporadic sequencing as far west as Texas, although there are no sequences from many of the intermediate states along the east coast (<xref rid="F2" ref-type="fig">Figure 2C</xref>).</p><p id="P15">To improve the coverage of EEEV sequences, including from 2019, we sequenced an additional 80 isolates from across Massachusetts (n=17), Connecticut (n=38), and New York (n=25) (<xref rid="SD2" ref-type="supplementary-material">Table S1</xref>). They were primarily from <italic toggle="yes">Cs. melanura</italic> (n=63), although there were also isolates from other mosquito species, horses, and a turkey (<xref rid="SD2" ref-type="supplementary-material">Table S1</xref>). These isolates were sampled from 2015&#x02013;2019, including 48 from 2019, and were mostly from counties from which there were previously few or no sequences, particularly in Connecticut (<xref rid="F2" ref-type="fig">Figure 2B</xref>). Combining our new EEEV sequences with publicly available data (n = 531), we performed a joint phylogeographic and phylogenetic reconstruction (<xref rid="F2" ref-type="fig">Figure 2D</xref>). We estimate the time of origin of the US phylogeny to be 1923-03-15 (95% Highest Posterior Density (HPD): 1920-07-02 to 1925-11-25), ten years before EEEV was first detected causing a large horse outbreak in Virginia, 1933.<sup><xref rid="R1" ref-type="bibr">1</xref></sup></p><p id="P16">Supporting previous results of phylogeographic analysis<sup><xref rid="R12" ref-type="bibr">12</xref></sup>, we found that EEEV transmission in Florida acts as a source of virus introductions into other states (<xref rid="F2" ref-type="fig">Figure 2D</xref>). When investigating the movement between states across the whole posterior distribution of the phylogeographic reconstruction, we found that 86.7% of EEEV movements start in Florida, and end in every other state in the dataset (<xref rid="F2" ref-type="fig">Figure 2E</xref>). It is worth noting that there are not many sequences from states outside of Florida and the Northeast, and so movements involving states such as Texas, Georgia, and Virginia should be interpreted with caution, and there are likely regional dynamics which we could not uncover with this dataset.</p><p id="P17">Using our new EEEV sequences, we found that the 2019 outbreak in the Northeast involved several independent virus introductions (<xref rid="F2" ref-type="fig">Figure 2D</xref>), all from Florida. These introductions were not related to other previous EEEV clusters sequenced in the Northeast. Therefore, the 2019 outbreak in the Northeast consisted of multiple EEEV lineages most likely introduced from the reservoir population in Florida, as opposed to long-term regional persistence or a single introduction with explosive growth.</p></sec><sec id="S5"><title>EEEV lineages do not typically persist longer than a few years in the Northeast</title><p id="P18">Having found that EEEV circulation in the Northeast, including the 2019 outbreak, is mostly driven by repeated introductions from Florida, we explored the maintenance of these lineages once they become established in the region. Due to the lack of sequences from Florida in general, but especially after 2014, the clades estimated by our discrete phylogeographic analysis are likely not precise estimates of the timings of EEEV introductions into the Northeast (<xref rid="F2" ref-type="fig">Figure 2D</xref>). In particular, we expect that we have estimated larger and longer-lived clusters after 2014 than there are in reality, as they do not contain sequences from Florida which would pull the introduction date closer to the present. To account for this, we subdivided any Northeastern clusters with unexpectedly long internal branches (see Methods). This also included clusters from before 2014, indicating that sampling bias specifically involving Florida is an issue throughout the dataset. This procedure resulted in splitting the 61 EEEV introductions inferred from our discrete trait analysis into 75 separate introductions into the Northeast (<xref rid="F3" ref-type="fig">Figure 3A</xref>).</p><p id="P19">Of these 75 introductions, we found 26 consisting of three or more sequences. On average, these took 1.17 (95% HPD: 0.46&#x02013;3.27) years to be first detected in the genomic dataset and circulated in the Northeast for an average of 2.8 (95% HPD: 0.65&#x02013;7.5) years after being introduced (<xref rid="F3" ref-type="fig">Figure 3B</xref>). This supports previous analysis of the region showing limited multi-year maintenance in the region<sup><xref rid="R13" ref-type="bibr">13</xref>,<xref rid="R14" ref-type="bibr">14</xref></sup>. The groups of lineages can be seen to roughly follow three wave patterns in the 2000s, between 2010 and 2014, and then 2014 to 2019 (<xref rid="F3" ref-type="fig">Figure 3C</xref>), possibly corresponding to infection and immunity patterns within the bird population in the region.</p><p id="P20">Of the 26 larger Northeastern introductions, 8 included samples from the 2019 outbreak, and half of these were solely composed of 2019 samples (<xref rid="F3" ref-type="fig">Figure 3C</xref>). We estimate that the average introduction time of these 2019 clusters was in mid-2017 (95% HPD: 2015-11-14 to 2019-01-15), and the earliest introduction was late 2015. Therefore, the EEEV lineages sequenced from 2019 were introduced no more than 4 years before the outbreak and after the most recent Northeast EEEV outbreak in 2014.</p></sec><sec id="S6"><title>Multi-state spread of EEEV originating in Massachusetts</title><p id="P21">Considering that EEEV lineages have a short lifespan in the Northeast (<xref rid="F3" ref-type="fig">Figure 3</xref>), we subsequently investigated the extent to which they could spread within the region during that time. Of the 26 Northeast clusters with three or more EEEV sequences (<xref rid="F3" ref-type="fig">Figure 3C</xref>), most (n=19) were from a single state, and only a single cluster was found in three states despite the density of sequencing in the region. Of the 7 clusters with sequences from multiple states, we found that most viral movements were inferred to be from Massachusetts to other states (7 out of 8 movements in the MCC tree, <xref rid="F4" ref-type="fig">Figure 4A</xref>) and the origin of 5 out of 6 subtrees was in Massachusetts (<xref rid="F4" ref-type="fig">Figure 4B</xref>). The remaining subtree circulated mostly in Connecticut but contains a sequence from Massachusetts. Importantly, multi-state clusters were not necessarily sampled in neighboring counties (<xref rid="F4" ref-type="fig">Figure 4B</xref>), indicating true spread within the region, possibly by infected birds.</p><p id="P22">Only two of these multi-state clusters contain sequences from New York, despite the majority of EEEV sequences being from that state. These sequences were from the southeast of the state (<xref rid="F4" ref-type="fig">Figure 4B</xref>), closer to the prominent Massachusetts-Connecticut focus rather than the transmission clusters in upstate New York. Therefore, while limited regional spread is happening, it primarily only involves the eastern part of the region where smaller states are close together. We note however that uneven temporal and spatial sampling, even within the Northeast, may lead to undiscovered dynamics in multi-state spread.</p><p id="P23">While none of the multi-state clusters were solely sampled in 2019, we found that half of them contain EEEV sequences sampled in 2019 (<xref rid="F4" ref-type="fig">Figure 4B</xref>). Therefore, the 2019 outbreak appears to have a wider within-cluster geographical spread than previous ones (e.g., 2012&#x02013;2014 sequences are only found in 2 subtrees; <xref rid="F4" ref-type="fig">Figure 4B</xref>). The spread in 2019 was possibly driven by the high numbers of infected mosquitoes (<xref rid="F1" ref-type="fig">Figure 1D</xref>) leading to more infected birds and more opportunities for cross-state movements. We emphasize, however, that cases were mostly reported in counties that had previous EEEV cases (<xref rid="F1" ref-type="fig">Figure 1C</xref>), and so this was strictly a within-cluster effect and the outbreak as a whole does not show geographical expansion.</p></sec><sec id="S7"><title>Associations of virus, human, and bird factors with EEEV outbreaks were not found</title><p id="P24">The general epidemiology underlying the 2019 EEEV outbreak appears to be similar to previous outbreaks, with short-lived introductions from Florida driving transmission in the Northeast (<xref rid="F2" ref-type="fig">Figure 2</xref>&#x02013;<xref rid="F3" ref-type="fig">3</xref>), and infections occurring in similar locations (<xref rid="F1" ref-type="fig">Figure 1</xref>). Therefore any changes underlying case increases may be due to mosquito population, virus evolution, human behavior, or bird populations, and there are multiple possible factors that are not mutually exclusive. Determining which factors were important for the 2019 outbreak may help us to understand what drives EEEV outbreaks in general.</p><sec id="S8"><title>Intrinsic viral factors and effective population size</title><p id="P25">A major concern when any pathogen leads to a large increase in case counts is that it has evolved to have a higher virulence or transmissibility. In the case of EEEV, increased transmissibility would refer to a higher infection success in either mosquitoes or birds. Increased virulence would lead to increased case ascertainment, as diagnosis occurs on hospitalized individuals and most human infections are probably asymptomatic<sup><xref rid="R15" ref-type="bibr">15</xref></sup>. We would expect to see a phylogenetic signal for any intrinsic variability in transmissibility or virulence.</p><p id="P26">We searched the alignment for any nucleotide substitutions, relative to a reference sequence from 2005, which are common to some or all of the 2019 EEEV sequences. There were 17 substitutions across the genome shared by all of the 2019 sequences, a further two that more than 90% of them shared, and an additional two that 75% of them shared. These 21 substitutions, however, were found across the whole phylogeny, in at least 93% of non-2019 EEEV sequences. We found no shared substitutions unique to more than 75% the sequences sampled in 2019. This was expected given that these sequences are spread across the phylogeny (<xref rid="F2" ref-type="fig">Figure 2D</xref>), as there would have to be extremely strong positive selection leading to multiple instances of convergent evolution for unique shared substitutions to be possible. While some of these shared substitutions may have mild phenotypic effects, their spread across the phylogeny implies they are not a main driver of the increase in cases in 2019.</p><p id="P27">Past population size of viruses can be useful in inferring underlying transmission dynamics. We used a skygrid model<sup><xref rid="R16" ref-type="bibr">16</xref></sup> to estimate temporal changes in virus effective population size across the whole of the US. We found that there was a steady increase in effective population size in the 1990s, which then plateaued and decreased more recently in the late 2010s (<xref rid="SD1" ref-type="supplementary-material">Figure S1B</xref>). We then formally incorporated human and horse case data as covariates in the skygrid<sup><xref rid="R17" ref-type="bibr">17</xref></sup> hypothesizing that increased transmission in the mosquito-bird cycle could lead to more reported cases in humans and horses.</p><p id="P28">We tested 9 different case-based covariates independently using data from 2003 onwards, but we did not find any significant associations between the viral population size and any of these covariates (<xref rid="SD1" ref-type="supplementary-material">Figure S1C</xref>). There is, therefore, no simple association between national circulation and reported cases, meaning that regional dynamics are likely more important for regional cases.</p></sec><sec id="S9"><title>Case demographics and human behavior</title><p id="P29">Human behavior could be one explanation for the increase in human EEEV cases in 2019, which could be revealed by analyzing the case demographics. We did not however find any meaningful differences in case demographics or timing in 2019 compared to previous years since 2003 (<xref rid="SD1" ref-type="supplementary-material">Figure S2</xref>)</p><p id="P30">To further explore whether human behavior may have changed in 2019, leading to a higher EEEV exposure rate, we compared the length of time individuals spent outside in relevant counties in Massachusetts, Connecticut, and New York (<xref rid="SD1" ref-type="supplementary-material">Figure S2E</xref>). We performed a paired t-test on the indoor activity seasonality metric for each of these counties in June, July, August, and September between 2018 and 2019 (data only available for these years) using data from <sup><xref rid="R18" ref-type="bibr">18</xref></sup>. We found no evidence of a difference in indoor-ness between 2018 and 2019 in counties that had ever had a human case of EEEV (p=0.56) or only those which had a case in 2019 (p=0.72). Therefore, we found no evidence of time spent outdoors, the timing of cases, or case demographics being major drivers of EEEV outbreaks. Understanding the behaviors and activities linked to human exposure, however, is still an important area of research.</p></sec><sec id="S10"><title>Bird populations</title><p id="P31">Bird populations likely have a complicated role in EEEV outbreaks. While the presence of competent bird species is a necessity for EEEV transmission and large populations may lead to more infections, conversely, abnormally large bird populations may dilute the virus, decreasing the likelihood of mosquito infection during blood feeding<sup><xref rid="R19" ref-type="bibr">19</xref></sup>. Moreover, when sufficient opportunities exist for mosquitoes to feed on birds, it may limit the pursuit of mosquitoes to feed on alternate sources, such as humans and horses. Finally, bird population immunity is likely a key component of the potential for EEEV perpetuation, but studies that routinely collect bird serology data are difficult and not often conducted.</p><p id="P32">While data on birds are limited, we examined the effect of the (1) absolute abundance and (2) proportion relative to all species of 8 bird species for which <italic toggle="yes">Cs. melanura</italic> has a high blood feeding preference<sup><xref rid="R9" ref-type="bibr">9</xref>,<xref rid="R20" ref-type="bibr">20</xref></sup> on (A) human and horse cases and (B) mosquito EEEV infection rate using a Poisson regression. We also compared these metrics for 8 bird species for which a low feeding preference was estimated<sup><xref rid="R20" ref-type="bibr">20</xref></sup> as a control (<xref rid="SD1" ref-type="supplementary-material">Figure S3</xref>). There were no significant relationships when considering mosquito infection rates regardless of species or state. In New York, there were very few significant relationships in high-preference birds, and several in the low-preference bird species and so this comparison is likely not valid for New York. In Massachusetts and Connecticut, we found several positive relationships between case counts and high-preference bird species case counts (<xref rid="SD1" ref-type="supplementary-material">Figure S3</xref>) but also with a smaller number of low-preference birds. The relationship between specific bird presence and EEEV transmission is therefore complicated and not easily solved here. There are, however, some low-preference birds with significant relationships (although fewer), meaning that the relationship between specific bird presence and EEEV transmission/cases is complicated and not easily solved here.</p></sec></sec><sec id="S11"><title>EEEV outbreaks are primarily driven by the infection dynamics within mosquito populations</title><p id="P33">After finding no evidence for associations with other factors, we subsequently focused on mosquitoes where we have detailed temporal data. For all three states, when there were more EEEV-positive <italic toggle="yes">Cs. melanura</italic> pools, there were more human and horse cases (<xref rid="F5" ref-type="fig">Figure 5A</xref>), and we also found the same strong correlation between the <italic toggle="yes">Cs. melanura</italic> infection rates and case counts (<xref rid="SD1" ref-type="supplementary-material">Figure S4A</xref>&#x02013;<xref rid="SD1" ref-type="supplementary-material">B</xref>). To further explore the within-season EEEV dynamics, we focused on Connecticut and Massachusetts, for which we have more detailed mosquito data. We examined monthly <italic toggle="yes">Cs. melanura</italic> abundance (mosquitoes/trap/day), EEEV infection rate, and vector index (abundance multiplied by the infection rate to estimate the relative number of infected mosquitoes<sup><xref rid="R21" ref-type="bibr">21</xref>,<xref rid="R22" ref-type="bibr">22</xref></sup>) for each state (<xref rid="F5" ref-type="fig">Figure 5B</xref>). While there were considerable yearly variations, in general <italic toggle="yes">Cs. melanura</italic> abundance rapidly increased in early summer, peaking by June to July. The EEEV infection rates lagged behind, peaking in August or September, with infected mosquitoes often being detected in Massachusetts earlier than Connecticut. Vector index, therefore, tended to rise earlier (July) and persist longer in Massachusetts than Connecticut, though it often peaks in August in both states. In 2019, we found that both the <italic toggle="yes">Cs. melanura</italic> abundance and EEEV infection rates were high in both states, leading to the highest vector index values in the 17-year dataset (<xref rid="F5" ref-type="fig">Figure 5B</xref>).</p><p id="P34">We next investigated whether environmental data could help explain the high abundances or EEEV infection rates. To explore this, we used index P<sup><xref rid="R23" ref-type="bibr">23</xref></sup>, a modeled estimate of reproduction number of mosquito-borne viruses based on climate factors, including temperature and humidity (<xref rid="SD1" ref-type="supplementary-material">Table S2</xref>). While our index P estimates usually peaked in July to August, similar to the vector index, we found that it correlated most closely with the <italic toggle="yes">Cs. melanura</italic> abundance (<xref rid="SD1" ref-type="supplementary-material">Figure S4C</xref>; correlation coefficient of 0.57, p&#x0003c;0.0001 for Connecticut, 0.24 and p&#x0003c;0.05 for Massachusetts). Furthermore, our modeled index P in 2019 was relatively average across the 17 years in both states (rank 9/17 for Connecticut, 7/17 for Massachusetts). Thus, for EEEV in the Northeast, index P is useful for describing the seasonal dynamics of transmission due to its ability to predict abundance, but the temperature and humidity variables alone are not capable of describing which years will have a high number of EEEV-infected mosquitoes.</p><p id="P35">To interrogate further how different factors combine to explain cases, we built a negative binomial regression model that uses index P, vector index, state, month of first EEEV detection, the year, and the month to explore counts of total human and horse cases (<xref rid="F5" ref-type="fig">Figure 5C</xref>&#x02013;<xref rid="F5" ref-type="fig">D</xref>, <xref rid="SD1" ref-type="supplementary-material">Table S3</xref>; results from different variations of the model are shown in <xref rid="SD1" ref-type="supplementary-material">Figure S5</xref>). Vector index (2.07, 95% CI: 1.5&#x02013;3.0), the month of first detection compared to June (3.17, 95% CI: 1.34&#x02013;7.92), index P with a 1-month lag (2.31, 95% CI: 1.19&#x02013;4.65), and being in the month of October (4.18, 95% CI: 1.39&#x02013;13.55), all lead to a significant increase in the risk of human and horse cases (<xref rid="F5" ref-type="fig">Figure 5C</xref>). Further, being in Massachusetts as compared to Connecticut had the largest increase in risk (11.95, 95% CI: 3.88&#x02013;43.70<italic toggle="yes">)</italic>. When used to fit cases each year, our modeled estimates tracked closely with observed cases, where cases with the model being off on average by 0.47 cases per observation (Mean Absolute Error = 0.47) and had strong explanatory power (Nagelkerke R<sup>2</sup> = 0.80; <xref rid="F5" ref-type="fig">Figure 5D</xref>).</p><p id="P36">Next, we applied this model to examine if there were early season predictors which might indicate an increased risk of horse and human cases later in the season (<xref rid="F5" ref-type="fig">Figure 5E</xref>). As index P does not correlate well with vector index, we held index P constant and simulated vector index across a range of values to predict the total human and horse cases for the year, and to explore its relationship with the month of first detection. The timing of the first detection of EEEV in mosquitoes is also important, and of particular note is that years with high case counts always first detected EEEV in July (<xref rid="F5" ref-type="fig">Figure 5E</xref>). This makes intuitive sense as the virus has more time to circulate to high levels in birds while there are sufficient mosquitoes present for it to transmit to humans. While the interaction between first EEEV detection in July and the vector index is not significant, this could be in part due to no cases being detected in years when the vector index was high but EEEV was first detected after July. The impact of the timing of the vector index is clear however, with a 220% increase in risk of cases when EEEV is detected in July (<xref rid="F5" ref-type="fig">Figure 5E</xref>). This is reflected in the empirical data, as the maximum number of cases in years when EEEV is detected after July is only 5.</p><p id="P37">Our negative-binomial regression model could be used as a tool for mosquito surveillance programs to estimate the risk of cases, which typically are reported in August-October, based on the timing of first detection and the vector index. For example, if EEEV is detected in mosquitoes in July in Massachusetts, and the vector index in August is 0.15 (similar to the value measured in 2019), we predict 7.0 human and horse cases in total that year (95% CI: 2.9&#x02013;16.6), compared to 2.2 cases (95% CI: 0.6&#x02013;7.9) if EEEV is detected after July during a typical summer season. In Connecticut, the same situation would correspond to an expected 0.6 cases (95% CI: 0.2&#x02013;1.8) for July detection and 0.2 cases (95% CI: 0.1 to 0.6) for a later detection. With a more extreme August vector index of 0.30 in Massachusetts (higher than has ever been measured), our model predicts 89.2 cases (95% CI: 17.0&#x02013;468.5) if EEEV is detected in July versus 28.2 cases (95% CI: 3.4&#x02013;231.3) cases being detected later. While these predictions have wide confidence intervals, they provide a relative estimate of the possible extent of the cases in a given year, and therefore an indication of how much effort should be put into various mosquito control measures.</p><p id="P38">Finally, while all of our previous results focused on <italic toggle="yes">Cs. melanura, Coquillettidia perturbans</italic> is also thought to be an important bridge vector for infections in horses and humans<sup><xref rid="R9" ref-type="bibr">9</xref>,<xref rid="R24" ref-type="bibr">24</xref></sup>. This species has higher trap collectionson average in Connecticut than <italic toggle="yes">Cs. melanura</italic> (<xref rid="SD1" ref-type="supplementary-material">Figure S4D</xref>). However, only 9 <italic toggle="yes">Cq. perturbans</italic> pools were positive for EEEV from 2003&#x02013;2019 in the state, or 1.9% of all positive pools; and it was only the 8th most commonly positive mosquito species for EEEV. In 2019, there were six EEEV positive pools of <italic toggle="yes">Cq. perturbans</italic> sampled in Connecticut, making it the third most commonly sampled positive mosquito species for the year, although it still only made up 5% of the positive mosquito pools. s <italic toggle="yes">Cq. perturbans</italic> did however make up a third of positive pools in Massachusetts in 2019<sup><xref rid="R9" ref-type="bibr">9</xref></sup>. Therefore, <italic toggle="yes">Cq. perturbans</italic> may still have a role as a bridge vector, but the transmission dynamics of EEEV in these states is primarily driven by <italic toggle="yes">Cs. melanura.</italic></p></sec></sec><sec id="S12"><title>Discussion</title><p id="P39">The 2019 EEEV outbreak in the Northeast US was exceptional in that it had the highest number of human cases recorded in more than 50 years, along with dense <italic toggle="yes">Cs. melanura</italic> vector populations with high virus infection rates (<xref rid="F1" ref-type="fig">Figure 1</xref> &#x00026; <xref rid="F5" ref-type="fig">5</xref>). We found that other components of 2019 were similar to previous outbreaks. We showed that EEEV is not persistently maintained in the Northeast, with virus lineages typically going extinct within the region within a few years (<xref rid="F3" ref-type="fig">Figure 3</xref>). Instead, the virus is frequently reintroduced into the region from Florida, where EEEV is enzootic (<xref rid="F2" ref-type="fig">Figure 2</xref>). Thus, EEEV outbreaks in the Northeast are limited by stochastic and deterministic factors that support new virus introductions, and to habitats that are suitable for the mosquito vectors. We identified two primary transmission foci in the Northeast: (<italic toggle="yes">1</italic>) an eastern, coastal focus which encompasses most of Massachusetts and Connecticut, and (<italic toggle="yes">2</italic>) a western focus in central New York (<xref rid="F1" ref-type="fig">Figure 1</xref>). The 2019 outbreak primarily occurred in the former. We found that human and horse cases are associated with a high vector index (large number of EEEV infected <italic toggle="yes">Cs. melanura</italic> mosquitoes), and we constructed a model using environmental and mosquito surveillance data that could estimate cases (<xref rid="F5" ref-type="fig">Figure 5</xref>). Finally, we found that a high early season vector index can be used by surveillance systems to predict human EEEV risk and direct control efforts (<xref rid="F5" ref-type="fig">Figure 5E</xref>). It remains unclear as to what causes high EEEV infection rates in mosquitoes, and therefore what contributed to the exceptionally high rate in 2019.</p><p id="P40">We conducted a phylodynamic analysis of our 80 newly-generated EEEV genome sequences combined with historical samples to explore the dynamics of EEEV in the Northeast of the US, with a focus on 2019 (<xref rid="F2" ref-type="fig">Figure 2</xref>). As both EEEV isolates and extracted RNA are designated as Select Agents in the US, it is extremely difficult to obtain clearance to store, transport, and in this case, sequence them. Thus our genomic dataset is critical to support future EEEV research. Using these additional sequences, we confirmed earlier studies which identified Florida as the source of EEEV introductions into the Northeast and other parts of the US<sup><xref rid="R12" ref-type="bibr">12</xref></sup> (<xref rid="F2" ref-type="fig">Figure 2</xref>). The documented endemic transmission in Florida and the limited number of EEEV cases reported outside of the US add further support to the hypothesis of Florida as a source for the Northeast. EEEV sequences from outside of the US, however, are limited in number (n=3) and we did not include these data in our analysis. Therefore, we cannot rule out a non-US external source of introductions into the Northeast. Further sequencing from other countries, enabling a broader, regional analysis of EEEV would allow the investigation of the international dynamics of EEEV and the identification of at-risk regions.</p><p id="P41">We found that while interstate spread of EEEV within the Northeast is not common, Massachusetts appears to be an important focus for when it does happen (<xref rid="F4" ref-type="fig">Figure 4</xref>). This may be in part due to bird migration routes, more consistent EEEV activity in Massachusetts compared to the surrounding states (<xref rid="F1" ref-type="fig">Figure 1</xref> &#x00026; <xref rid="F5" ref-type="fig">5</xref>), and/or that EEEV infection in mosquitoes in Massachusetts increases earlier in the year than it does in Connecticut (<xref rid="F5" ref-type="fig">Figure 5</xref>). Thus, controlling EEEV transmission in Massachusetts may help to alleviate some EEEV transmission in other states.</p><p id="P42">In discussing the movement of EEEV across the US, it is important to note that there is significant sampling bias in our dataset, in terms of both time and location of the sequences. Most of the sequences are from the Northeast US, and there are no sequences from Florida after 2014. While we have attempted to mitigate the latter point by splitting Northeastern clusters with long branches (see Methods), geographical heterogeneity can lead to overconfidence in the transition times<sup><xref rid="R25" ref-type="bibr">25</xref></sup>. Further, the lack of EEEV sequences from other East Coast states may lead to an underestimate of the importance of those states in the spread of EEEV from Florida, and we are unable to examine the introduction or transmission dynamics in any other region of the country. After Florida, the Northeast has the most reported human and horse cases in the US. It therefore has an outsized importance for understanding the dynamics of EEEV. Obtaining data from other EEEV outbreaks (e.g. Michigan) would provide another opportunity to examine the outbreak dynamics. The sequencing of EEEV samples prior to 2003, a wider geographical range of samples in all time periods, and from Florida after 2014 would greatly add to the reliability and resolution of any phylodynamic study of EEEV.</p><p id="P43">While some characteristics of the EEEV outbreak in 2019, such as human case traits and climate factors, were within expected ranges, it is clear that many mosquito factors were unusually high (<xref rid="F5" ref-type="fig">Figure 5</xref>). For example, both Massachusetts and Connecticut had a very high abundance of <italic toggle="yes">Cs. melanura</italic> and the vector index for the latter state was the highest ever recorded. While EEEV has a complex ecology, by using data from detailed mosquito surveillance programs, we were able to find strong connections between mosquito infection rate, abundance (connected to climate factors), and human and horse cases. We then developed and applied a negative binomial regression model to utilize early season values of mosquito-specific predictors (most notably the month of first detection and vector index) to provide early estimates of overall case counts for that year. This important development will provide departments of health with estimates to help direct control strategies, and enable more effective communication of risk to the public.</p><p id="P44">Our models and estimates have several limitations. First, there are more cases in Massachusetts than Connecticut to inform our model. As such, the Connecticut predictions are heavily influenced by Massachusetts case counts, and given the highly localized nature of EEEV, the model may not accurately represent conditions in Connecticut. While vector index is a direct risk estimate of EEEV cases, index P had a greater effect estimate in our model. This could be due to our model not fully accounting for the inherent seasonality of EEEV transmission that overlaps with high values of index P or that the true value of index P, which is modeled with a certain degree of uncertainty, lies a significant distance outside the determined estimate. Due to lack of information on EEEV in <italic toggle="yes">Cs. melanura</italic>, index P is estimated using the transmission probability, bird incubation period, bird infectious period and extrinsic incubation period derived from previous West Nile virus research of <italic toggle="yes">Culex pipiens</italic> species<sup><xref rid="R26" ref-type="bibr">26</xref></sup>. This lack of data for EEEV priors may be confounding the predictive power of this parameter. Finally, veterinary cases are reported voluntarily and the true case counts include interventions undertaken in those years. These interventions include a highly recommended horse vaccination and mosquito spraying: the former will cloud the association between mosquito factors and case counts as exposures may not convert to cases. Both lead to an underestimate of true, unaltered case counts as the model is fitted to partially controlled epidemics.</p><p id="P45">Despite these limitations, on a short timescale, we have some predictive ability of human and horse cases of EEEV (<xref rid="F5" ref-type="fig">Figure 5</xref>). When considering longer timescales, we still cannot use climate-informed models, like index P, for annual predictions of outbreaks. This is because, while climatic factors are vital for the high abundance of <italic toggle="yes">Cs. melanura</italic> required for an intense EEEV year, they cannot predict when the virus will be present. Index P therefore may be a more effective way to predict EEEV case counts in Florida where the virus is continuously maintained<sup><xref rid="R27" ref-type="bibr">27</xref></sup>, but should be used with caution in scenarios where the virus must be introduced.</p><p id="P46">To provide longer-term predictions (i.e. on a time scale of years), we must therefore understand what drives introductions of EEEV from Florida into the Northeast. The missing piece here is large-scale studies on bird immunity, as waves of infection in the Northeastern bird population are likely driven by the renewal of the susceptible population, potentially through birth<sup><xref rid="R9" ref-type="bibr">9</xref>,<xref rid="R28" ref-type="bibr">28</xref></sup>. Theoretically, the dynamics could be similar to those of Middle Eastern Respiratory Syndrome (MERS)<sup><xref rid="R29" ref-type="bibr">29</xref></sup>, wherein cycles of infection due to buildup of susceptibles in the reservoir population leads to spillover events into other species. Certainly, we found that EEEV appears to have waves of introductions into the Northeast which co-circulate before going extinct shortly afterwards, which would be expected from local depletion of susceptible birds.</p><p id="P47">In understanding EEEV outbreaks in humans and horses, we must look to a combination of dynamics of other arboviruses like West Nile and dengue in terms of the mosquito populations, as well as viruses that mostly exist in reservoir populations and spillover into humans, such as MERS. The complex interplay of these factors make long-term prediction with our current data sources difficult, as we do not have enough information on bird immunity and its interaction with EEEV transmission and spillover. We do know, however, that a large mosquito population, enabled by warm and wet conditions, is necessary, and an increase in years with warm and wet summers and mild winters may increase the frequency of outbreaks. Therefore, while the interactions in EEEV with climatic factors are more complex than with some other arboviruses, climate change may still represent an increase in risk as more years will be permissive for outbreaks in mammals. In any case, all of these results rest on a timely and robust mosquito surveillance program, as currently exists in New York, Massachusetts, and Connecticut. Widespread and consistent trapping and rapid analysis provides the data required to calculate vector index, which is the strongest correlate of human and horse cases later in the season. It is imperative that programs like this, also of use for other mosquito-borne viruses such as West Nile virus, continue to be funded and expanded, even as competition for public health funding increases.</p></sec><sec id="S13"><title>STAR Methods</title><sec id="S14"><title>Resource Availability</title><sec id="S15"><title>Lead contact</title><p id="P48">Further information and requests for resources should be directed to and will be fulfilled by the lead contact Nathan Grubaugh (<email>nathan.grubaugh@yale.com</email>).</p></sec><sec id="S16"><title>Materials availability</title><p id="P49">This study did not generate new unique reagents</p></sec><sec sec-type="data-availability" id="S17"><title>Data and code availability</title><list list-type="bullet" id="L1"><list-item><p id="P50">New EEEV genomes have been deposited in Genbank and are publicly available as of the date of publication. Accession numbers are listed in the <xref rid="T1" ref-type="table">key resources table</xref>. Case data for EEE, the disease caused by EEEV, is existing, publicly available data. It is a notifiable disease and so human case data is routinely reported to the federal government. This surveillance data is available from ArboNET, on request from the CDC <ext-link xlink:href="https://wwwn.cdc.gov/arbonet/maps/ADB_Diseases_Map/index.html" ext-link-type="uri">https://wwwn.cdc.gov/arbonet/maps/ADB_Diseases_Map/index.html</ext-link>. Case data that we combed from the literature is summarized at <ext-link xlink:href="https://github.com/grubaughlab/eeev-genomics" ext-link-type="uri">https://github.com/grubaughlab/eeev-genomics</ext-link>. Original shape files for generating maps are publicly available from <ext-link xlink:href="https://gadm.org/" ext-link-type="uri">gadm.org</ext-link>. Bird banding data is publicly available and can be found here: <ext-link xlink:href="10.5066/P9BSM38F" ext-link-type="doi">https://doi.org/10.5066/P9BSM38F</ext-link>. Mosquito data cannot be shared in a public repository due to data protection issues. It is available on request to Alexander Ciota (New York state, <email>alexander.ciota@ny.gov</email>), Philip Armstrong (Connecticut, <email>philip.armstrong@ct.gov</email>) or Sandra Smole (Massachusetts, <email>sandra.smole@state.ma.us</email>).</p></list-item><list-item><p id="P51">All original code, including BEAST XMLs, has been deposited in a Github repository at <ext-link xlink:href="https://github.com/grubaughlab/eeev-genomics" ext-link-type="uri">https://github.com/grubaughlab/eeev-genomics</ext-link> and is publicly available as of the date of publication.</p></list-item><list-item><p id="P52">Any additional information required to reanalyze the data reported in this paper is available from the lead contact upon request.</p></list-item></list></sec></sec><sec id="S18"><title>Method details</title><sec id="S19"><title>Ethics</title><p id="P53">No human samples or direct clinical data were used in this study. Sequencing of remnant veterinarian samples by the Wadsworth Center were done following institutional protocols. All data are available through aggregated surveillance databases as described below.</p></sec><sec id="S20"><title>Mosquito surveillance</title><p id="P54">In New York State (NYS), since 2012 (including 2019), 13 counties representing all regions of NYS have been surveilled, as previously described <sup><xref rid="R30" ref-type="bibr">30</xref></sup>. In total, &#x0003e;100,000 pooled individuals representing 53 species are tested for EEEV each year, this includes ~15,000 pooled Cs. melaura annually, which are predominantly trapped in the main EEEV/<italic toggle="yes">Cs. melanura</italic> focus including Oswego, Oneida, Onondaga and Madison Counties. Trapping was completed using a combination of Centers for Disease Control and Prevention (CDC) light traps, gravid traps and diurnal resting boxes. Resting boxes were primarily used in EEEV endemic areas to collect <italic toggle="yes">Cs. melanura</italic>. Mosquito specimens were sorted by species and pooled for testing. Pools of 10&#x02013;60 mosquitoes were shipped on dry ice to the NYS Arbovirus Laboratory for EEEV testing by molecular and cellular methods. Specifically, pools containing a zinc-plated steel bead and 1ml mosquito diluent (20% heat-inactivated fetal bovine serum (FBS) in Dulbecco&#x02019;s phosphate-buffered saline plus 50 &#x003bc;g/mL penicillin/streptomycin, 50 &#x003bc;g/mL gentamicin, and 2.5 &#x003bc;g/mL Fungizone) were homogenized using a mixer mill for 30 sec at 24Hz and centrifuged for 5 min at 6000 rcf. Quantitative reverse transcriptase polymerase chain reactions (qRT-PCR) were performed using two distinct primer and probe sets, following RNA extraction and purification, as previously described<sup><xref rid="R31" ref-type="bibr">31</xref></sup>. In addition, 100 &#x003bc;L of supernatant from <italic toggle="yes">Cs. melanura</italic> pools were inoculated on Vero cell culture and monitored for cytopathic effect. EEEV isolates obtained from a single round of amplification were used for sequencing.</p><p id="P55">In Massachusetts, mosquito surveillance was conducted from mid-May through to mid-October, as previously described<sup><xref rid="R32" ref-type="bibr">32</xref>,<xref rid="R33" ref-type="bibr">33</xref></sup>. Trapping was performed by the Massachusetts Department of Public Health (MDPH) in collaboration with 10 local mosquito control projects (MCP) at semi-variable frequencies visiting non-fixed trap sites spread across all 14 counties. Site visitation frequency increased with high volume collections of vector species and narrowed to weekly-biweekly over time in correlation with increased site-specific target mosquito abundance. Targeted sites visitation frequency increased to weekly at minimum when EEEV activity was detected and persisted through the duration of the seasonal surveillance period. Weekly collections were performed at 10 fixed collection sites in Bristol and Plymouth counties known to be historically active EEEV sentinel sites. These site collections increased to twice a week after initial EEEV detection.</p><p id="P56">Mosquito collection methods varied depending on MCP, however nearly all successful <italic toggle="yes">Cs. melanura</italic> collections were performed using primarily CDC-Miniature Light traps with a CO<sub>2</sub> source (either dry ice or regulated tank flow ranging from 250&#x02013;500cc), gravid traps baited with an infusion of lactalbumin-yeast-hay with oak leaves, or resting boxes placed primarily in locales with both deciduous and evergreen freshwater forested swamps. Light traps and gravid traps were placed in the early morning-late afternoon and retrieved 24 hours later, and resting boxes were visited once weekly. Mosquito trap canisters collected from the field were transported to the laboratory in an igloo cooler lined with dry ice, freeze-killed in an ultra-low &#x02212;80&#x000b0;C freezer, identified by species using a dichotomous key to characterize morphological differences with a stereoscope, and pooled in sample vials of 5&#x02013;50 female mosquitoes. Sample pools were grouped by species/trap site/date of collection before being submitted to the MDPH Molecular Diagnostics lab for arbovirus testing.</p><p id="P57">In Connecticut, mosquito trapping and arbovirus surveillance was conducted from the beginning of June through the end of October at 91 fixed collection sites, distributed among all 8 counties, as previously described in <sup><xref rid="R34" ref-type="bibr">34</xref></sup>. Trapping locations, where <italic toggle="yes">Cs. melanura</italic> were likely to be collected or where there was historical record of EEEV activity, were established in sparsely populated rural settings that included permanent fresh-water swamps (red maple/white cedar) and bogs, coastal salt marshes, horse stables, and swamp-forest border environs. Additional trap sites are located in more densely populated urban or suburban locales, including parks, greenways, golf courses, undeveloped wood lots, sewage treatment plants, dumping stations, and temporary wetlands associated with waterways.</p><p id="P58">Mosquito trapping was conducted with CO<sub>2</sub> (dry ice)-baited CDC miniature light traps equipped with aluminum domes or gravid mosquito traps baited with a lactalbumin-yeast-hay infusion. Traps were placed in the field in the afternoon, operated overnight, and retrieved the following morning. Trapping frequency was minimally made once every ten days at each trap site over the course of the entire season. Mosquito trapping frequency was increased at EEEV-positive sites to twice per week after the virus was isolated from that site. Adult mosquitoes were transported alive to the laboratory each morning in an ice chest lined with cool packs. Mosquitoes were immobilized with dry ice and transferred to chill tables where they were identified to species with the aid of a stereo microscope (90X) based on morphological characters. Female mosquitoes were pooled in groups of 50 or fewer by species, collection date, trap type, and collection site and stored at &#x02212;80&#x000b0;C until processed for virus isolation. Processed mosquito pools were inoculated into Vero cell cultures and screened for cytopathic effect (CPE) as previously described<sup><xref rid="R35" ref-type="bibr">35</xref></sup>. CPE positive virus cultures and the original mosquito pool were then tested for EEEV by TaqMan RT-PCR assay<sup><xref rid="R36" ref-type="bibr">36</xref></sup>.</p></sec><sec id="S21"><title>RNA isolation and virus sequencing</title><p id="P59">RNA was extracted on the MagMax-96 Express robot (Applied Biosystems, Foster City, CA) with the Magmax Viral isolation kit (ThermoFisher Scientific, Waltham, MA), according to manufacturer&#x02019;s specifications. 50 &#x003bc;L of sample was added to 130 &#x003bc;L of lysis buffer containing 20 &#x003bc;L of RNA binding beads diluted 1:1 with wash buffer. RNA was eluted in 90 &#x003bc;L of elution buffer. Primer pairs (<xref rid="SD1" ref-type="supplementary-material">Table S5</xref>) were used to generate 6 overlapping fragments of approximately 2.5 kb each using one-step superscript III RT&#x02013;PCR with platinum Taq (Life Technologies, Carlsbad, CA). Each reaction utilized 5 &#x003bc;L of RNA, 1 &#x003bc;L of enzyme, and a 0.4 &#x003bc;M final concentration of primer pairs in a total reaction volume of 25 &#x003bc;L. Thermocycler amplification was completed using the following conditions: 55&#x000b0;C for 30 min; 94&#x000b0;C for 2 min; 40 cycles of 94&#x000b0;C for 15 sec, 55&#x000b0;C for 30 sec, 68&#x000b0;C for 3.5 min; and a final extension of 68 &#x000b0;C for 10 min (Simpliamp by Applied Biosystems, Waltham, MA). Two uL of amplicons were visualized on a 1% agarose gel to confirm size and quality, and subsequently purified using Zymo DNA Clean and Concentrate (Zymo Research, Irvine, CA). Amplicons from individual isolates were pooled and sent to the Wadsworth Center Advanced Genomic Technologies Core for library preparation and indexing using the Nextera XT kit (Illumina, San Diego, CA) according to manufacturer&#x02019;s protocols.</p><p id="P60">Sequencing was performed on the Illumina MiSeq platform (San Diego, CA). Paired-end reads were assembled to a 2014 Connecticut isolate from <italic toggle="yes">Cs. melanura</italic> (KX029260) deploying Geneious Prime&#x02019;s reference mapping tool with high sensitivity and free end gaps using 10 iterations of fine tuning and trimming paired read overhangs. Mean coverage/base ranged from 703&#x02013;2132x. Resultant consensus sequences were used for downstream analyses. We generated complete genome consensus sequences for all 80 sequenced isolates.</p></sec><sec id="S22"><title>Nucleotide alignments and phylogenetic analysis</title><p id="P61">In total, 80 new samples of EEEV were sequenced from 2015&#x02013;2019. 451 additional whole genome sequences from prior to this study were downloaded from Genbank (see <xref rid="SD1" ref-type="supplementary-material">Table S6</xref>). Those not from the US and without location data were removed, and the remaining combined with the new sequences to give a dataset of 523 sequences.</p><p id="P62">We aligned the sequences using Mafft version 1.3.7<sup><xref rid="R37" ref-type="bibr">37</xref></sup>, and removed the non-coding regions at either end of the genome, giving a final multiple sequence alignment with a length of 11,277 bases. A maximum-likelihood phylogenetic tree was generated using IQ-TREE 2.1.4<sup><xref rid="R38" ref-type="bibr">38</xref></sup> using an HKY substitution model and temporal signal was assessed in TempEst<sup><xref rid="R39" ref-type="bibr">39</xref></sup>. A single molecular clock outlier (ID: AY722102) was removed, as described in<sup><xref rid="R40" ref-type="bibr">40</xref></sup>.</p><p id="P63">We estimated introductions into the Northeast (defined as New York, Connecticut, Massachusetts, New Hampshire, Vermont, Rhode Island and Maine) by conducting a discrete trait phylogeographic analysis (DTA) at the state level in BEAST 1.10<sup><xref rid="R41" ref-type="bibr">41</xref></sup>, with an asymmetric CTMC model. We also used a non-parametric skygrid coalescent model<sup><xref rid="R16" ref-type="bibr">16</xref></sup> estimated using Hamiltonian Monte Carlo sampling<sup><xref rid="R42" ref-type="bibr">42</xref></sup>, an HKY substitution model<sup><xref rid="R43" ref-type="bibr">43</xref></sup>, and a strict clock model<sup><xref rid="R44" ref-type="bibr">44</xref></sup>. We used tip-date sampling for those sequences without exact sampling dates, with a starting date given as 0.6 of the way through the appropriate year (i.e. August) with a standard deviation of three months. We estimate Markov jump histories for the full posterior to obtain estimates of location transitions between states in the DTA, and summarize them using TaxaMarkovJumpHistoryAnalyzer<sup><xref rid="R45" ref-type="bibr">45</xref></sup>. We performed two independent replicates of this analysis, with each chain running for 100 million iterations, removing 10% for burn-in. Convergence and mixing were assessed in Tracer 1.7<sup><xref rid="R46" ref-type="bibr">46</xref></sup>. Further, we found a strong temporal signal for this dataset (<xref rid="SD1" ref-type="supplementary-material">Figure S1</xref>) with an estimated evolutionary rate of 1.86&#x000d7;10<sup>&#x02212;4</sup> (95% HPD: 1.77&#x000d7;10<sup>&#x02212;4</sup>-1.95&#x000d7;10<sup>&#x02212;4</sup>) substitutions per site per year, in line with previous estimates<sup><xref rid="R12" ref-type="bibr">12</xref></sup>.</p><p id="P64">An introduction node was considered to be the first node which was inferred to be in one of the Northeastern states and downstream tips were counted as part of the cluster. One introduction left Massachusetts and returned to Florida. As this is unlikely given bird migration patterns, and the confidence in the location of the node was low (52% Massachusetts, 46% Florida), we instead used the child node which was found in Massachusetts, thereby excluding the Florida sequence from this cluster.</p><p id="P65">As there are no sequences from Florida (which was estimated to be the backbone of the phylogeny) after 2014, and relatively few before, the DTA will underestimate the number of introductions in total as they will not be broken up by Florida sequences. The date of the introduction node (the first node in the cluster inferred to be in the Northeast) will therefore also be too far in the past, as the lack of Florida sequences in the cluster means that the location of the node is inferred incorrectly. Therefore, we set out to split up some introductions which contained long branches and likely represented unsampled Floridian diversity. We identified all of the clusters which contained tips only from the Northeast with more than three sequences and more than 50% of the sequences sampled in 2014 or earlier (i.e. when the last Floridian sequence was sampled); and calculated their average branch length (1.28 years). We then traversed the tree, and for any branches where both the parent and child node were inferred to be in the Northeast, but were more than twice the standard deviation (1.52 years) above the average branch length (threshold = 4.33 years), we assigned the introduction node as the child of the pair instead of the parent. This therefore moved the introduction node closer to the present, and sometimes excluded Northeastern sequences on the sister branch, making separate introductions. The final number of introductions into the Northeast before this procedure was 42 prior to 2014 and 19 after, and 49 and 26 respectively, adding 14 more introductions in total.</p><p id="P66">To test for nucleotide substitutions common to 2019 sequences, we compared the consensus sequences to the reference sequence used in<sup><xref rid="R47" ref-type="bibr">47</xref></sup>, which has Genbank accession ID KJ469556.</p><p id="P67">We have also built a Nextstrain page to further explore the data, which can be found at <ext-link xlink:href="https://www.zlab.bio/guide-design-resourcesnextstrain.org/community/grubaughlab/eeev-genomics" ext-link-type="uri">nextstrain.org/community/grubaughlab/eeev-genomics</ext-link>.</p></sec><sec id="S23"><title>Mosquito transmission suitability model - index P</title><p id="P68">Index P is an estimate of the transmission potential by a single female mosquito using Bayesian methods and mosquito-virus specific priors (<xref rid="SD1" ref-type="supplementary-material">Table S3</xref>), including transmission probability as a function of temperature and relative humidity. Unlike the basic reproduction number, R<sub>0</sub>, index P does not need to be greater than one to cause sustained transmission, as index P is multiplied by the ratio of human to mosquitoes to derive R<sub>0</sub>. We estimated the variable index P using the Mosquito Virus Suitability Estimator (MVSE), an R package to download the functions for modeling the suitability of a given environment for mosquito-borne virus transmission<sup><xref rid="R23" ref-type="bibr">23</xref></sup>. Temperature and humidity data for each state were calculated by taking the average temperature for each day in the center of each county in the state. These county level data were then averaged to obtain a single temperature estimate for the entire state. All weather data were provided by <ext-link xlink:href="https://www.visualcrossing.com/" ext-link-type="uri">visualcrossing.com</ext-link>. Index P was calculated from April to October, in line with the transmission season for EEEV. All negative temperatures were set to zero in the model to avoid erroneous results, as at zero or below, mosquitoes are in a hibernation state and so there is no mosquito activity that varies by temperature.</p><p id="P69">We used a 1 month lag time from index P to cases to account for delays caused by requiring transmission into humans and horses, followed by incubation times and time to diagnosis. Therefore the relevant mosquito activity will be before human and horse cases are reported.</p><p id="P70">While index P is seen as an important covariate in the negative binomial regression model, it is difficult to tease out the seasonality of the mosquito season with cases. Due to the sporadic nature of EEEV in the Northeast, index P is a necessary but not sufficient parameter to consider. To test whether temperature could be used as a proxy, an additional model was tested by replacing index P with temperature which resulted in a slightly higher Akaike information criterion (AIC) score (231.4 vs 232.3) and wider confidence interval. Given the widespread use of modeled mosquito viability parameters, we opted to keep index P. However, future research and surveillance programs may wish to utilize temperature, an easily obtained parameter with little uncertainty in its estimate.</p></sec><sec id="S24"><title>Regression model fit to cases</title><p id="P71">We restricted the case data (described above) to Connecticut and Massachusetts for the model where we had sufficient mosquito data to calculate the Vector Index. Dispersion was detected with a dispersion parameter alpha = 0.18 (p-value = 0.019) using the dispersion test from the AER package in R <sup><xref rid="R48" ref-type="bibr">48</xref></sup>. This led us to fit a negative binomial regression model (estimated using ML) to predict human_equine with vector_index (formula: human_equine ~ vector_index + month_detected_july + indexP_lag1 + st_grp + year_index + month_f).</p><p id="P72">Given the vast differences in cases between Massachusetts and Connecticut we attempted to run stratified models of each state separately. However the model failed to converge for Connecticut, likely due to low availability of cases. Thus a model combining both was used. Months were included as categorical variables with the months May through July as reference groups. These months were combined due to May and June having no cases, making parameter estimates fail to converge when separate. The parameter &#x02018;first month detected July&#x02019; was a binary variable determined by identifying the month when the first non-zero value for the vector index occurred for each year. All continuous data were normalized so interpretation of estimates are for a 1 standard deviation increase in the term.</p><p id="P73">Effect modification of vector index by month of detection was explored in addition to the original model without effect modification. AIC scores of the model with effect modification and without were nearly identical (231.4 vs 231.2 respectively) and an ANOVA test was conducted between the two models and found to have no difference (p-value = 0.14). While no difference was identified, this may be due in part to the small sample size of years where the month detected was after July.</p><p id="P74">In addition to effect modification, given some of the complexity of index P, we explored the terms temperature 1-month lag and mosquito abundance 1-month lag in replacement of index P. Utilizing the two point rule of thumb for AIC, the abundance model performed worse (231.4 vs 233.2) and its estimate was not significant (CI 95%: 0.57&#x02013;1.62). The temperature performed slightly worse but similar to the index P model (AIC 231.4 vs 232.3) but had a larger standard error (CI 95%: 1.15&#x02013;9.31). Given the desire to explore the utility of index P and its higher performance we opted to focus on this model. However, for simplicity sake future work may utilize temperature for its ease of use and similar performance (<xref rid="SD1" ref-type="supplementary-material">Figure S6</xref> and <xref rid="SD1" ref-type="supplementary-material">Table S4</xref>).</p><p id="P75">Utilizing the DHARMa version 0.4.6 package in R (<ext-link xlink:href="https://cran.r-project.org/package=DHARMa" ext-link-type="uri">https://CRAN.R-project.org/package=DHARMa</ext-link>), we simulated the residuals 1,000 times to test for heteroskedasticity, zero inflation, and autocorrelation. Upon visual inspection no heteroskedasticity of the residuals was detected. The simulated ratio of expected to actual zeros was 1.01 (p-value = 0.776) The Durbin-Watson test for autocorrelation was conducted on a subset of the Massachusetts data to avoid duplicate time indexes. In addition to subsetting the data, index P with and without a 1-month lag was tested per the suggestion of the Durbin-Watson test to avoid lagging covariates. Autocorrelation was borderline but insignificant without the index P lag (DW = 1.59, p-value = 0.051).</p><p id="P76">It must be noted that our model was restricted to a monthly time scale to match monthly case data. Given the short duration of the EEEV transmission season, certain dynamics may be missed on the weekly or even daily timescale. There was not enough case data within each month to explore impacts of detection on a month by month basis, making the month detection piece of the analysis less specific.</p></sec></sec><sec id="S25"><title>Quantification and statistical analysis</title><sec id="S26"><title>Maximum-likelihood estimation of infection rate, relative abundance, and vector index</title><p id="P77">The maximum-likelihood estimation (MLE) of the infection rate is a pooled infection rate of positive EEEV pools, and was estimated using the CDC R software package PooledInfRate (<ext-link xlink:href="https://github.com/CDCgov/PooledInfRate" ext-link-type="uri">https://github.com/CDCgov/PooledInfRate</ext-link>). This estimation procedure takes into account that there may be different numbers of positive mosquitoes in each positive pool, and so estimates the likely number of positive mosquitoes in each pool based on the overall number of positive pools. The relative abundance was calculated as the average number of mosquitoes captured per trap per night. Vector index is these two metrics multiplied together <sup><xref rid="R21" ref-type="bibr">21</xref>,<xref rid="R22" ref-type="bibr">22</xref></sup>.</p></sec><sec id="S27"><title>Virus effective population size using a skygrid model</title><p id="P78">To identify any possible associations between effective population size and case counts, we applied the latter as covariates to the estimation of population size using the skygrid model<sup><xref rid="R17" ref-type="bibr">17</xref></sup>. We began by comparing 12 possible covariates (all human and animal cases, just human cases, just horse cases, and all cases in Massachusetts, Connecticut, and New York with 0, 1 and 2 year lags) to effective population estimated sizes using a skygrid model with no covariates<sup><xref rid="R16" ref-type="bibr">16</xref></sup>. On the basis of this preliminary analysis, we ran formal analyses with all cases, human cases, and horse cases and the relevant lags. We also only used sequence and case data from 2003 onwards (n=423), when the surveillance program began, in order to eliminate some noise from the data. BEAST runs were set up as above with tip-date sampling, HKY substitution models and a non-parametric skygrid coalescent model. Grid points were externally set to correspond to the start of each year.</p><p id="P79">Case counts for years between the inferred time of origin of the tree and 2003 were estimated independently using a normal prior, whose mean is the recorded case count. The standard deviation was calculated such that all national cases and horse case covariates were allowed to have &#x000b1;5 cases in the 95% confidence interval; and human covariates were allowed to have &#x000b1;1 cases in the same interval, as the recording of the latter is more precise. This was also undertaken for 2021 data for both analyses with the 2 year lag covariates, as finalized data has not been released by ArboNET at time of writing.</p><p id="P80">Starting values for unobserved years were taken from news reports and other publicly available sources. Most of the researched outbreaks were reported in Corrin <italic toggle="yes">et al,</italic> 2021<sup><xref rid="R49" ref-type="bibr">49</xref></sup>, and data were supplemented by going to each of the references given in that paper. Data for outbreaks in Michigan were supplemented by information in<sup><xref rid="R50" ref-type="bibr">50</xref></sup>, and Massachusetts data were supplemented using Stobierski <italic toggle="yes">et al</italic> 2022, Grady <italic toggle="yes">et al</italic> 1978 and Feemster <italic toggle="yes">et al</italic> 1938<sup><xref rid="R51" ref-type="bibr">51</xref>&#x02013;<xref rid="R53" ref-type="bibr">53</xref></sup>. Data for all states were supplemented using CDC Morbidity and Mortality Weekly reports in relevant years. Horse cases used are both confirmed and suspected, due to a lack of equine testing, especially in the earlier epidemics.</p></sec><sec id="S28"><title>Human outdoorness measurements</title><p id="P81">How much time people spent indoors or outdoors was taken from Susswein <italic toggle="yes">et al</italic> 2022<sup><xref rid="R18" ref-type="bibr">18</xref></sup>, who used anonymized GPS data from mobile phones. This data was only available for 2018 and 2019. We took the average indoor/outdoorness for each county which had a case in 2019, or had ever had a case and performed a dependent t-test in Python for paired samples to compare the metric between years. Significance was taken to be a p-value of less than 0.05.</p></sec><sec id="S29"><title>Bird abundance</title><p id="P82">Bird banding data to calculate abundance and proportion were obtained from the North American Bird Banding Program dataset<sup><xref rid="R54" ref-type="bibr">54</xref></sup>. All ages of birds were used. Bird species were selected using data from Kramer <italic toggle="yes">et al</italic> 2015<sup><xref rid="R20" ref-type="bibr">20</xref></sup>, who calculated the relative feeding preference of <italic toggle="yes">Cs. melanura</italic> in Connecticut using a blood meal analysis and normalizing it by abundance of the bird species in question. High-preference birds in this analysis were the 8 species identified in this paper, and low-preference birds were randomly selected from their list of birds for which <italic toggle="yes">Cs. melanura</italic> appeared to have no preference. We conducted Poisson regressions in Python for each combination for the abundance or proportion of a bird species in a given year against the human and horse cases or mosquito infection rate (both defined above). A 5% significance level was used.</p></sec></sec></sec><sec sec-type="supplementary-material" id="SM1"><title>Supplementary Material</title><supplementary-material id="SD1" position="float" content-type="local-data"><label>Supplementary information</label><media xlink:href="NIHMS1907424-supplement-Supplementary_information.pdf" id="d64e1283" position="anchor"/></supplementary-material><supplementary-material id="SD2" position="float" content-type="local-data"><label>Table S1</label><caption><p id="P83">Table S1 | Metadata for newly sequenced EEEV isolates, related to <xref rid="F2" ref-type="fig">Figure 2</xref></p></caption><media xlink:href="NIHMS1907424-supplement-Table_S1.xlsx" id="d64e1291" position="anchor"/></supplementary-material></sec></body><back><ack id="S30"><title>Acknowledgements</title><p id="P84">We thank the seasonal mosquito surveillance programs from Connecticut, Massachusetts, and each county in New York, Wadsworth Center Advanced Genomic Technologies Core for assistance with sequencing, D. Weinberger for help with the statistical model, J. Howard for his thoughts, and P. Jack and S. Taylor for providing comments on an early draft. Research reported in this publication was supported by the National Institute Of Allergy And Infectious Diseases of the National Institutes of Health under Award Number DP2AI176740 (NDG), CTSA Grant Number UL1 TR001863 from the National Center for Advancing Translational Science (NCATS), a component of the National Institutes of Health (CBFV), the Cooperative Agreement Number U01CK000509 funded by the Centers for Disease Control and Northeast Center of Excellence (PMA, ATC), the KU Leuven Internal Funds Grant No. C14/18/094 (GB), and the Research Foundation - Flanders award &#x0201c;Fonds voor Wetenschappelijk Onderzoek - Vlaanderen,&#x0201d; G0E1420N, G098321N (GB). The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health or the Centers for Disease Control and Prevention.</p></ack><fn-group><fn fn-type="COI-statement" id="FN4"><p id="P85">Declarations of interest</p><p id="P86">The authors declare no conflicts of interest related to this work.</p></fn><fn id="FN5"><p id="P87" content-type="publisher-disclaimer">This is a PDF file of an unedited manuscript that has been accepted for publication. As a service to our customers we are providing this early version of the manuscript. The manuscript will undergo copyediting, typesetting, and review of the resulting proof before it is published in its final form. Please note that during the production process errors may be discovered which could affect the content, and all legal disclaimers that apply to the journal pertain.</p></fn></fn-group><ref-list><title>References</title><ref id="R1"><label>1.</label><mixed-citation publication-type="journal">Giltner, and Shahan (<year>1933</year>). <article-title>The 1933 outbreak of infectious equine encephalomyelitis in the eastern states</article-title>. <source>North Am. Vet</source>.</mixed-citation></ref><ref id="R2"><label>2.</label><mixed-citation publication-type="journal"><name><surname>TenBroeck</surname><given-names>C</given-names></name>, and <name><surname>Merrill</surname><given-names>MH</given-names></name> (<year>1933</year>). <article-title>A serological difference between eastern and western equine encephalomyelitis virus</article-title>. <source>Proc. Soc. Exp. Biol. Med</source>. <volume>31</volume>.</mixed-citation></ref><ref id="R3"><label>3.</label><mixed-citation publication-type="journal"><name><surname>Lindsey</surname><given-names>NP</given-names></name>, <name><surname>Erin Staples</surname><given-names>J</given-names></name>, and <name><surname>Fischer</surname><given-names>M</given-names></name> (<year>2018</year>). <article-title>Eastern Equine Encephalitis Virus in the United States, 2003&#x02013;2016</article-title>. <source>Am. J. Trop. Med. Hyg</source>. <volume>98</volume>, <fpage>1472</fpage>.<pub-id pub-id-type="pmid">29557336</pub-id></mixed-citation></ref><ref id="R4"><label>4.</label><mixed-citation publication-type="journal"><name><surname>Lindsey</surname><given-names>NP</given-names></name>, <name><surname>Martin</surname><given-names>SW</given-names></name>, <name><surname>Staples</surname><given-names>JE</given-names></name>, and <name><surname>Fischer</surname><given-names>M</given-names></name> (<year>2020</year>). <article-title>Notes from the Field: Multistate Outbreak of Eastern Equine Encephalitis Virus - United States, 2019</article-title>. <source>MMWR Morb. Mortal. Wkly. Rep</source>. <volume>69</volume>, <fpage>50</fpage>&#x02013;<lpage>51</lpage>.<pub-id pub-id-type="pmid">31945032</pub-id></mixed-citation></ref><ref id="R5"><label>5.</label><mixed-citation publication-type="book"><name><surname>Shamus</surname><given-names>KJ</given-names></name> (<year>2019</year>). <source>Deaths from mosquito-borne EEE virus prompt calls to cancel outdoor events in Michigan</source>. <publisher-name>USA Today</publisher-name>.</mixed-citation></ref><ref id="R6"><label>6.</label><mixed-citation publication-type="webpage"><name><surname>Tunison</surname><given-names>J</given-names></name> (<year>2019</year>). <article-title>Despite assurances, aerial mosquito spraying plan leaves some concerned</article-title>. <source>mlive</source>. <comment><ext-link xlink:href="https://www.mlive.com/news/kalamazoo/2019/09/despite-assurances-aerial-mosquito-spraying-plan-leaves-some-concerned.html" ext-link-type="uri">https://www.mlive.com/news/kalamazoo/2019/09/despite-assurances-aerial-mosquito-spraying-plan-leaves-some-concerned.html</ext-link></comment>.</mixed-citation></ref><ref id="R7"><label>7.</label><mixed-citation publication-type="book"><name><surname>Howard</surname><given-names>J</given-names></name> (<year>2019</year>). <source>Why did EEE cases spike this year? It&#x02019;s complicated</source>. <publisher-name>CNN</publisher-name>. <comment><ext-link xlink:href="https://www.cnn.com/2019/10/03/health/eee-outbreak-2019-cause/index.html" ext-link-type="uri">https://www.cnn.com/2019/10/03/health/eee-outbreak-2019-cause/index.html</ext-link></comment>.</mixed-citation></ref><ref id="R8"><label>8.</label><mixed-citation publication-type="book"><name><surname>Morris</surname><given-names>CD</given-names></name> (<year>1988</year>). <part-title>Eastern equine encephalomyelitis</part-title>. In <source>The Arboviruses: epidemiology and ecology</source>, <name><surname>Monath</surname><given-names>TP</given-names></name>, ed. (<publisher-name>CRC Press</publisher-name>), pp. <fpage>1</fpage>&#x02013;<lpage>20</lpage>.</mixed-citation></ref><ref id="R9"><label>9.</label><mixed-citation publication-type="journal"><name><surname>Armstrong</surname><given-names>PM</given-names></name>, and <name><surname>Andreadis</surname><given-names>TG</given-names></name> (<year>2022</year>). <article-title>Ecology and Epidemiology of Eastern Equine Encephalitis Virus in the Northeastern United States: An Historical Perspective</article-title>. <source>J. Med. Entomol</source>. <volume>59</volume>. <pub-id pub-id-type="doi">10.1093/jme/tjab077</pub-id>.</mixed-citation></ref><ref id="R10"><label>10.</label><mixed-citation publication-type="journal"><name><surname>Molaei</surname><given-names>G</given-names></name>, <name><surname>Oliver</surname><given-names>J</given-names></name>, <name><surname>Andreadis</surname><given-names>TG</given-names></name>, <name><surname>Armstrong</surname><given-names>PM</given-names></name>, and <name><surname>Howard</surname><given-names>JJ</given-names></name> (<year>2006</year>). <article-title>Molecular identification of blood-meal sources in Culiseta melanura and Culiseta morsitans from an endemic focus of eastern equine encephalitis virus in New York</article-title>. <source>Am. J. Trop. Med. Hyg</source>. <volume>75</volume>, <fpage>1140</fpage>&#x02013;<lpage>1147</lpage>.<pub-id pub-id-type="pmid">17172382</pub-id></mixed-citation></ref><ref id="R11"><label>11.</label><mixed-citation publication-type="journal"><name><surname>Mundis</surname><given-names>SJ</given-names></name>, <name><surname>Harrison</surname><given-names>S</given-names></name>, <name><surname>Pelley</surname><given-names>D</given-names></name>, <name><surname>Durand</surname><given-names>S</given-names></name>, and <name><surname>Ryan</surname><given-names>SJ</given-names></name> (<year>2022</year>). <article-title>Spatiotemporal Environmental Drivers of Eastern Equine Encephalitis Virus in Central Florida: Towards a Predictive Model for a Lethal Disease</article-title>. <source>J. Med. Entomol</source>. <pub-id pub-id-type="doi">10.1093/jme/tjac113</pub-id>.</mixed-citation></ref><ref id="R12"><label>12.</label><mixed-citation publication-type="journal"><name><surname>Tan</surname><given-names>Y</given-names></name>, <name><surname>Lam</surname><given-names>TT-Y</given-names></name>, <name><surname>Heberlein-Larson</surname><given-names>LA</given-names></name>, <name><surname>Smole</surname><given-names>SC</given-names></name>, <name><surname>Auguste</surname><given-names>AJ</given-names></name>, <name><surname>Hennigan</surname><given-names>S</given-names></name>, <name><surname>Halpin</surname><given-names>RA</given-names></name>, <name><surname>Fedorova</surname><given-names>N</given-names></name>, <name><surname>Puri</surname><given-names>V</given-names></name>, <name><surname>Stockwell</surname><given-names>TB</given-names></name>, <etal/> (<year>2018</year>). <article-title>Large-Scale Complete-Genome Sequencing and Phylodynamic Analysis of Eastern Equine Encephalitis Virus Reveals Source-Sink Transmission Dynamics in the United States</article-title>. <source>J. Virol</source>. <volume>92</volume>. <pub-id pub-id-type="doi">10.1128/JVI.00074-18</pub-id>.</mixed-citation></ref><ref id="R13"><label>13.</label><mixed-citation publication-type="journal"><name><surname>Young</surname><given-names>DS</given-names></name>, <name><surname>Kramer</surname><given-names>LD</given-names></name>, <name><surname>Maffei</surname><given-names>JG</given-names></name>, <name><surname>Dusek</surname><given-names>RJ</given-names></name>, <name><surname>Backenson</surname><given-names>PB</given-names></name>, <name><surname>Mores</surname><given-names>CN</given-names></name>, <name><surname>Bernard</surname><given-names>KA</given-names></name>, and <name><surname>Ebel</surname><given-names>GD</given-names></name> (<year>2008</year>). <article-title>Molecular epidemiology of eastern equine encephalitis virus, New York</article-title>. <source>Emerg. Infect. Dis</source>. <volume>14</volume>, <fpage>454</fpage>&#x02013;<lpage>460</lpage>.<pub-id pub-id-type="pmid">18325261</pub-id></mixed-citation></ref><ref id="R14"><label>14.</label><mixed-citation publication-type="journal"><name><surname>Oliver</surname><given-names>J</given-names></name>, <name><surname>Tan</surname><given-names>Y</given-names></name>, <name><surname>Haight</surname><given-names>JD</given-names></name>, <name><surname>Tober</surname><given-names>KJ</given-names></name>, <name><surname>Gall</surname><given-names>WK</given-names></name>, <name><surname>Zink</surname><given-names>SD</given-names></name>, <name><surname>Kramer</surname><given-names>LD</given-names></name>, <name><surname>Campbell</surname><given-names>SR</given-names></name>, <name><surname>Howard</surname><given-names>JJ</given-names></name>, <name><surname>Das</surname><given-names>SR</given-names></name>, <etal/> (<year>2020</year>). <article-title>Spatial and temporal expansions of Eastern equine encephalitis virus and phylogenetic groups isolated from mosquitoes and mammalian cases in New York State from 2013 to 2019</article-title>. <source>Emerg. Microbes Infect</source>. <volume>9</volume>, <fpage>1638</fpage>&#x02013;<lpage>1650</lpage>.<pub-id pub-id-type="pmid">32672516</pub-id></mixed-citation></ref><ref id="R15"><label>15.</label><mixed-citation publication-type="journal"><name><surname>Morens</surname><given-names>DM</given-names></name>, <name><surname>Folkers</surname><given-names>GK</given-names></name>, and <name><surname>Fauci</surname><given-names>AS</given-names></name> (<year>2019</year>). <article-title>Eastern Equine Encephalitis Virus - Another Emergent Arbovirus in the United States</article-title>. <source>N. Engl. J. Med</source>. <volume>381</volume>, <fpage>1989</fpage>&#x02013;<lpage>1992</lpage>.<pub-id pub-id-type="pmid">31747726</pub-id></mixed-citation></ref><ref id="R16"><label>16.</label><mixed-citation publication-type="journal"><name><surname>Gill</surname><given-names>MS</given-names></name>, <name><surname>Lemey</surname><given-names>P</given-names></name>, <name><surname>Faria</surname><given-names>NR</given-names></name>, <name><surname>Rambaut</surname><given-names>A</given-names></name>, <name><surname>Shapiro</surname><given-names>B</given-names></name>, and <name><surname>Suchard</surname><given-names>MA</given-names></name> (<year>2012</year>). <article-title>Improving Bayesian Population Dynamics Inference: A Coalescent-Based Model for Multiple Loci</article-title>. <source>Mol. Biol. Evol</source>. <volume>30</volume>, <fpage>713</fpage>&#x02013;<lpage>724</lpage>.<pub-id pub-id-type="pmid">23180580</pub-id></mixed-citation></ref><ref id="R17"><label>17.</label><mixed-citation publication-type="journal"><name><surname>Gill</surname><given-names>MS</given-names></name>, <name><surname>Lemey</surname><given-names>P</given-names></name>, <name><surname>Bennett</surname><given-names>SN</given-names></name>, <name><surname>Biek</surname><given-names>R</given-names></name>, and <name><surname>Suchard</surname><given-names>MA</given-names></name> (<year>2016</year>). <article-title>Understanding Past Population Dynamics: Bayesian Coalescent-Based Modeling with Covariates</article-title>. <source>Syst. Biol</source>. <volume>65</volume>, <fpage>1041</fpage>&#x02013;<lpage>1056</lpage>.<pub-id pub-id-type="pmid">27368344</pub-id></mixed-citation></ref><ref id="R18"><label>18.</label><mixed-citation publication-type="journal"><name><surname>Susswein</surname><given-names>Z</given-names></name>, <name><surname>Rest</surname><given-names>EC</given-names></name>, and <name><surname>Bansal</surname><given-names>S</given-names></name> (<year>2022</year>). <article-title>Disentangling the rhythms of human activity in the built environment for airborne transmission risk</article-title>. <source>medRxiv</source>, <fpage>2022.04.07.22273578</fpage>.</mixed-citation></ref><ref id="R19"><label>19.</label><mixed-citation publication-type="journal"><name><surname>Kramer</surname><given-names>LD</given-names></name>, and <name><surname>Ciota</surname><given-names>AT</given-names></name> (<year>2015</year>). <article-title>Dissecting vectorial capacity for mosquito-borne viruses</article-title>. <source>Curr. Opin. Virol</source>. <volume>15</volume>, <fpage>112</fpage>&#x02013;<lpage>118</lpage>.<pub-id pub-id-type="pmid">26569343</pub-id></mixed-citation></ref><ref id="R20"><label>20.</label><mixed-citation publication-type="journal"><name><surname>Molaei</surname><given-names>G</given-names></name>, <name><surname>Thomas</surname><given-names>MC</given-names></name>, <name><surname>Muller</surname><given-names>T</given-names></name>, <name><surname>Medlock</surname><given-names>J</given-names></name>, <name><surname>Shepard</surname><given-names>JJ</given-names></name>, <name><surname>Armstrong</surname><given-names>PM</given-names></name>, and <name><surname>Andreadis</surname><given-names>TG</given-names></name> (<year>2016</year>). <article-title>Dynamics of Vector-Host Interactions in Avian Communities in Four Eastern Equine Encephalitis Virus Foci in the Northeastern U.S</article-title>. <source>PLoS Negl. Trop. Dis</source>. <volume>10</volume>, <fpage>e0004347</fpage>.<pub-id pub-id-type="pmid">26751704</pub-id></mixed-citation></ref><ref id="R21"><label>21.</label><mixed-citation publication-type="confproc"><name><surname>Nasci</surname><given-names>RS</given-names></name>, <name><surname>Doyle</surname><given-names>M</given-names></name>, <name><surname>Biggerstaff</surname><given-names>BJ</given-names></name>, and <name><surname>LeBailly</surname><given-names>A</given-names></name> (<year>2005</year>). <source>Calculation and application of a vector index (VI) reflecting the number of WN virus infected mosquitoes in a population</source>. <conf-name>71st annual meeting of the American</conf-name>.</mixed-citation></ref><ref id="R22"><label>22.</label><mixed-citation publication-type="journal"><name><surname>Fauver</surname><given-names>JR</given-names></name>, <name><surname>Pecher</surname><given-names>L</given-names></name>, <name><surname>Schurich</surname><given-names>JA</given-names></name>, <name><surname>Bolling</surname><given-names>BG</given-names></name>, <name><surname>Calhoon</surname><given-names>M</given-names></name>, <name><surname>Grubaugh</surname><given-names>ND</given-names></name>, <name><surname>Burkhalter</surname><given-names>KL</given-names></name>, <name><surname>Eisen</surname><given-names>L</given-names></name>, <name><surname>Andre</surname><given-names>BG</given-names></name>, <name><surname>Nasci</surname><given-names>RS</given-names></name>, <etal/> (<year>2016</year>). <article-title>Temporal and Spatial Variability of Entomological Risk Indices for West Nile Virus Infection in Northern Colorado: 2006&#x02013;2013</article-title>. <source>J. Med. Entomol</source>. <volume>53</volume>, <fpage>425</fpage>&#x02013;<lpage>434</lpage>.<pub-id pub-id-type="pmid">26718715</pub-id></mixed-citation></ref><ref id="R23"><label>23.</label><mixed-citation publication-type="journal"><name><surname>Obolski</surname><given-names>U</given-names></name>, <name><surname>Perez</surname><given-names>PN</given-names></name>, <name><surname>Villabona-Arenas</surname><given-names>CJ</given-names></name>, <name><surname>Th&#x000e9;z&#x000e9;</surname><given-names>J</given-names></name>, <name><surname>Faria</surname><given-names>NR</given-names></name>, and <name><surname>Louren&#x000e7;o</surname><given-names>J</given-names></name> (<year>2019</year>). <article-title>MVSE: An R-package that estimates a climate-driven mosquito-borne viral suitability index</article-title>. <source>Methods Ecol. Evol</source>. <volume>10</volume>, <fpage>1357</fpage>&#x02013;<lpage>1370</lpage>.<pub-id pub-id-type="pmid">32391139</pub-id></mixed-citation></ref><ref id="R24"><label>24.</label><mixed-citation publication-type="journal"><name><surname>Sherwood</surname><given-names>JA</given-names></name>, <name><surname>Stehman</surname><given-names>SV</given-names></name>, <name><surname>Howard</surname><given-names>JJ</given-names></name>, and <name><surname>Oliver</surname><given-names>J</given-names></name> (<year>2020</year>). <article-title>Cases of Eastern equine encephalitis in humans associated with Aedes canadensis, Coquillettidia perturbans and Culiseta melanura mosquitoes with the virus in New York State from 1971 to 2012 by analysis of aggregated published data</article-title>. <source>Epidemiol. Infect</source>. <volume>148</volume>, <fpage>e72</fpage>.<pub-id pub-id-type="pmid">32234110</pub-id></mixed-citation></ref><ref id="R25"><label>25.</label><mixed-citation publication-type="journal"><name><surname>Layan</surname><given-names>M</given-names></name>, <name><surname>M&#x000fc;ller</surname><given-names>NF</given-names></name>, <name><surname>Dellicour</surname><given-names>S</given-names></name>, <name><surname>De Maio</surname><given-names>N</given-names></name>, <name><surname>Bourhy</surname><given-names>H</given-names></name>, <name><surname>Cauchemez</surname><given-names>S</given-names></name>, and <name><surname>Baele</surname><given-names>G</given-names></name> (<year>2023</year>). <article-title>Impact and mitigation of sampling bias to determine viral spread: Evaluating discrete phylogeography through CTMC modeling and structured coalescent model approximations</article-title>. <source>Virus Evol</source>
<volume>9</volume>, <fpage>vead010</fpage>.<pub-id pub-id-type="pmid">36860641</pub-id></mixed-citation></ref><ref id="R26"><label>26.</label><mixed-citation publication-type="journal"><name><surname>Louren&#x000e7;o</surname><given-names>J</given-names></name>, <name><surname>Thompson</surname><given-names>RN</given-names></name>, <name><surname>Th&#x000e9;z&#x000e9;</surname><given-names>J</given-names></name>, and <name><surname>Obolski</surname><given-names>U</given-names></name> (<year>2020</year>). <article-title>Characterising West Nile virus epidemiology in Israel using a transmission suitability index</article-title>. <source>Euro Surveill</source>. <volume>25</volume>. <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2020.25.46.1900629</pub-id>.</mixed-citation></ref><ref id="R27"><label>27.</label><mixed-citation publication-type="journal"><name><surname>Bigler</surname><given-names>WJ</given-names></name>, <name><surname>Lassing</surname><given-names>EB</given-names></name>, <name><surname>Buff</surname><given-names>EE</given-names></name>, <name><surname>Prather</surname><given-names>EC</given-names></name>, <name><surname>Beck</surname><given-names>EC</given-names></name>, and <name><surname>Hoff</surname><given-names>GL</given-names></name> (<year>1976</year>). <article-title>Endemic Eastern Equine Encephalomyelitis in Florida: A Twenty-Year Analysis, 1955&#x02013;1974</article-title>. <source>Am. J. Trop. Med. Hyg</source>. <volume>25</volume>, <fpage>884</fpage>&#x02013;<lpage>890</lpage>.<pub-id pub-id-type="pmid">12669</pub-id></mixed-citation></ref><ref id="R28"><label>28.</label><mixed-citation publication-type="journal"><name><surname>Elias</surname><given-names>SP</given-names></name>, <name><surname>Keenan</surname><given-names>P</given-names></name>, <name><surname>Kenney</surname><given-names>JL</given-names></name>, <name><surname>Morris</surname><given-names>SR</given-names></name>, <name><surname>Covino</surname><given-names>KM</given-names></name>, <name><surname>Robinson</surname><given-names>S</given-names></name>, <name><surname>Foss</surname><given-names>KA</given-names></name>, <name><surname>Rand</surname><given-names>PW</given-names></name>, <name><surname>Lubelczyk</surname><given-names>C</given-names></name>, <name><surname>Lacombe</surname><given-names>EH</given-names></name>, <etal/> (<year>2017</year>). <article-title>Seasonal Patterns in Eastern Equine Encephalitis Virus Antibody in Songbirds in Southern Maine</article-title>. <source>Vector Borne Zoonotic Dis</source>. <volume>17</volume>, <fpage>325</fpage>&#x02013;<lpage>330</lpage>.<pub-id pub-id-type="pmid">28287934</pub-id></mixed-citation></ref><ref id="R29"><label>29.</label><mixed-citation publication-type="journal"><name><surname>Dudas</surname><given-names>G</given-names></name>, <name><surname>Carvalho</surname><given-names>LM</given-names></name>, <name><surname>Rambaut</surname><given-names>A</given-names></name>, and <name><surname>Bedford</surname><given-names>T</given-names></name> (<year>2018</year>). <article-title>MERS-CoV spillover at the camel-human interface</article-title>. <source>Elife</source>
<volume>7</volume>. <pub-id pub-id-type="doi">10.7554/eLife.31257</pub-id>.</mixed-citation></ref><ref id="R30"><label>30.</label><mixed-citation publication-type="journal"><name><surname>Oliver</surname><given-names>J</given-names></name>, <name><surname>Lukacik</surname><given-names>G</given-names></name>, <name><surname>Kokas</surname><given-names>J</given-names></name>, <name><surname>Campbell</surname><given-names>SR</given-names></name>, <name><surname>Kramer</surname><given-names>LD</given-names></name>, <name><surname>Sherwood</surname><given-names>JA</given-names></name>, and <name><surname>Howard</surname><given-names>JJ</given-names></name> (<year>2018</year>). <article-title>Twenty years of surveillance for Eastern equine encephalitis virus in mosquitoes in New York State from 1993 to 2012. Parasit</article-title>. <source>Vectors</source>
<volume>11</volume>. <pub-id pub-id-type="doi">10.1186/s13071-018-2950-1</pub-id>.</mixed-citation></ref><ref id="R31"><label>31.</label><mixed-citation publication-type="journal"><name><surname>Zink</surname><given-names>SD</given-names></name>, <name><surname>Jones</surname><given-names>SA</given-names></name>, <name><surname>Maffei</surname><given-names>JG</given-names></name>, and <name><surname>Kramer</surname><given-names>LD</given-names></name> (<year>2013</year>). <article-title>Quadraplex qRT-PCR assay for the simultaneous detection of Eastern equine encephalitis virus and West Nile virus</article-title>. <source>Diagn. Microbiol. Infect. Dis</source>. <volume>77</volume>, <fpage>129</fpage>&#x02013;<lpage>132</lpage>.<pub-id pub-id-type="pmid">23891222</pub-id></mixed-citation></ref><ref id="R32"><label>32.</label><mixed-citation publication-type="journal"><name><surname>Kinsella</surname><given-names>CM</given-names></name>, <name><surname>Paras</surname><given-names>ML</given-names></name>, <name><surname>Smole</surname><given-names>S</given-names></name>, <name><surname>Mehta</surname><given-names>S</given-names></name>, <name><surname>Ganesh</surname><given-names>V</given-names></name>, <name><surname>Chen</surname><given-names>LH</given-names></name>, <name><surname>McQuillen</surname><given-names>DP</given-names></name>, <name><surname>Shah</surname><given-names>R</given-names></name>, <name><surname>Chan</surname><given-names>J</given-names></name>, <name><surname>Osborne</surname><given-names>M</given-names></name>, <etal/> (<year>2020</year>). <article-title>Jamestown Canyon virus in Massachusetts: clinical case series and vector screening</article-title>. <source>Emerg. Microbes Infect</source>. <volume>9</volume>, <fpage>903</fpage>&#x02013;<lpage>912</lpage>.<pub-id pub-id-type="pmid">32302268</pub-id></mixed-citation></ref><ref id="R33"><label>33.</label><mixed-citation publication-type="journal"><name><surname>Molaei</surname><given-names>G</given-names></name>, <name><surname>Andreadis</surname><given-names>TG</given-names></name>, <name><surname>Armstrong</surname><given-names>PM</given-names></name>, <name><surname>Thomas</surname><given-names>MC</given-names></name>, <name><surname>Deschamps</surname><given-names>T</given-names></name>, <name><surname>Cuebas-Incle</surname><given-names>E</given-names></name>, <name><surname>Montgomery</surname><given-names>W</given-names></name>, <name><surname>Osborne</surname><given-names>M</given-names></name>, <name><surname>Smole</surname><given-names>S</given-names></name>, <name><surname>Matton</surname><given-names>P</given-names></name>, <etal/> (<year>2013</year>). <article-title>Vector-host interactions and epizootiology of eastern equine encephalitis virus in Massachusetts</article-title>. <source>Vector Borne Zoonotic Dis</source>. <volume>13</volume>, <fpage>312</fpage>&#x02013;<lpage>323</lpage>.<pub-id pub-id-type="pmid">23473221</pub-id></mixed-citation></ref><ref id="R34"><label>34.</label><mixed-citation publication-type="journal"><name><surname>Petruff</surname><given-names>TA</given-names></name>, <name><surname>McMillan</surname><given-names>JR</given-names></name>, <name><surname>Shepard</surname><given-names>JJ</given-names></name>, <name><surname>Andreadis</surname><given-names>TG</given-names></name>, and <name><surname>Armstrong</surname><given-names>PM</given-names></name> (<year>2020</year>). <article-title>Increased mosquito abundance and species richness in Connecticut, United States 2001&#x02013;2019</article-title>. <source>Sci. Rep</source>. <volume>10</volume>, <fpage>1</fpage>&#x02013;<lpage>14</lpage>.<pub-id pub-id-type="pmid">31913322</pub-id></mixed-citation></ref><ref id="R35"><label>35.</label><mixed-citation publication-type="journal"><name><surname>Armstrong</surname><given-names>PM</given-names></name>, <name><surname>Andreadis</surname><given-names>TG</given-names></name>, <name><surname>Finan</surname><given-names>SL</given-names></name>, <name><surname>Shepard</surname><given-names>JJ</given-names></name>, and <name><surname>Thomas</surname><given-names>MC</given-names></name> (<year>2011</year>). <article-title>Detection of infectious virus from field-collected mosquitoes by vero cell culture assay</article-title>. <source>J. Vis. Exp</source>. <pub-id pub-id-type="doi">10.3791/2889</pub-id>.</mixed-citation></ref><ref id="R36"><label>36.</label><mixed-citation publication-type="journal"><name><surname>Armstrong</surname><given-names>PM</given-names></name>, <name><surname>Prince</surname><given-names>N</given-names></name>, and <name><surname>Andreadis</surname><given-names>TG</given-names></name> (<year>2012</year>). <article-title>Development of a multi-target TaqMan assay to detect eastern equine encephalitis virus variants in mosquitoes</article-title>. <source>Vector Borne Zoonotic Dis</source>. <volume>12</volume>, <fpage>872</fpage>&#x02013;<lpage>876</lpage>.<pub-id pub-id-type="pmid">22835151</pub-id></mixed-citation></ref><ref id="R37"><label>37.</label><mixed-citation publication-type="journal"><name><surname>Katoh</surname><given-names>K</given-names></name>, and <name><surname>Standley</surname><given-names>DM</given-names></name> (<year>2013</year>). <article-title>MAFFT Multiple Sequence Alignment Software Version 7: Improvements in Performance and Usability</article-title>. <source>Mol. Biol. Evol</source>. <volume>30</volume>, <fpage>772</fpage>.<pub-id pub-id-type="pmid">23329690</pub-id></mixed-citation></ref><ref id="R38"><label>38.</label><mixed-citation publication-type="journal"><name><surname>Minh</surname><given-names>BQ</given-names></name>, <name><surname>Schmidt</surname><given-names>HA</given-names></name>, <name><surname>Chernomor</surname><given-names>O</given-names></name>, <name><surname>Schrempf</surname><given-names>D</given-names></name>, <name><surname>Woodhams</surname><given-names>MD</given-names></name>, <name><surname>von Haeseler</surname><given-names>A</given-names></name>, and <name><surname>Lanfear</surname><given-names>R</given-names></name> (<year>2020</year>). <article-title>IQ-TREE 2: New Models and Efficient Methods for Phylogenetic Inference in the Genomic Era</article-title>. <source>Mol. Biol. Evol</source>. <volume>37</volume>, <fpage>1530</fpage>&#x02013;<lpage>1534</lpage>.<pub-id pub-id-type="pmid">32011700</pub-id></mixed-citation></ref><ref id="R39"><label>39.</label><mixed-citation publication-type="journal"><name><surname>Rambaut</surname><given-names>A</given-names></name>, <name><surname>Lam</surname><given-names>TT</given-names></name>, <name><surname>Max Carvalho</surname><given-names>L</given-names></name>, and <name><surname>Pybus</surname><given-names>OG</given-names></name> (<year>2016</year>). <article-title>Exploring the temporal structure of heterochronous sequences using TempEst (formerly Path-O-Gen)</article-title>. <source>Virus Evol</source>
<volume>2</volume>, <fpage>vew007</fpage>.<pub-id pub-id-type="pmid">27774300</pub-id></mixed-citation></ref><ref id="R40"><label>40.</label><mixed-citation publication-type="journal"><name><surname>Hill</surname><given-names>V</given-names></name>, and <name><surname>Baele</surname><given-names>G</given-names></name> (<year>2019</year>). <article-title>Bayesian estimation of past population dynamics in BEAST 1.10 using the Skygrid coalescent model</article-title>. <source>Mol. Biol. Evol</source>. <pub-id pub-id-type="doi">10.1093/molbev/msz172</pub-id>.</mixed-citation></ref><ref id="R41"><label>41.</label><mixed-citation publication-type="journal"><name><surname>Suchard</surname><given-names>MA</given-names></name>, <name><surname>Lemey</surname><given-names>P</given-names></name>, <name><surname>Baele</surname><given-names>G</given-names></name>, <name><surname>Ayres</surname><given-names>DL</given-names></name>, <name><surname>Drummond</surname><given-names>AJ</given-names></name>, and <name><surname>Rambaut</surname><given-names>A</given-names></name> (<year>2018</year>). <article-title>Bayesian phylogenetic and phylodynamic data integration using BEAST 1.10</article-title>. <source>Virus evolution</source>
<volume>4</volume>. <pub-id pub-id-type="doi">10.1093/ve/vey016</pub-id>.</mixed-citation></ref><ref id="R42"><label>42.</label><mixed-citation publication-type="journal"><name><surname>Baele</surname><given-names>G</given-names></name>, <name><surname>Gill</surname><given-names>MS</given-names></name>, <name><surname>Lemey</surname><given-names>P</given-names></name>, and <name><surname>Suchard</surname><given-names>MA</given-names></name> (<year>2020</year>). <article-title>Hamiltonian Monte Carlo sampling to estimate past population dynamics using the skygrid coalescent model in a Bayesian phylogenetics framework</article-title>. <source>Wellcome Open Research</source>
<volume>5</volume>. <pub-id pub-id-type="doi">10.12688/wellcomeopenres.15770.1</pub-id>.</mixed-citation></ref><ref id="R43"><label>43.</label><mixed-citation publication-type="journal"><name><surname>Hasegawa</surname><given-names>M</given-names></name>, <name><surname>Kishino</surname><given-names>H</given-names></name>, and <name><surname>Yano</surname><given-names>T</given-names></name> (<year>1985</year>). <article-title>Dating of the human-ape splitting by a molecular clock of mitochondrial DNA</article-title>. <source>J. Mol. Evol</source>. <volume>22</volume>, <fpage>160</fpage>&#x02013;<lpage>174</lpage>.<pub-id pub-id-type="pmid">3934395</pub-id></mixed-citation></ref><ref id="R44"><label>44.</label><mixed-citation publication-type="journal"><name><surname>Ferreira</surname><given-names>MAR</given-names></name>, and <name><surname>Suchard</surname><given-names>MA</given-names></name> (<year>2008</year>). <article-title>Bayesian analysis of elapsed times in continuous-time Markov chains</article-title>. <source>Can. J. Stat</source>. <volume>36</volume>, <fpage>355</fpage>&#x02013;<lpage>368</lpage>.</mixed-citation></ref><ref id="R45"><label>45.</label><mixed-citation publication-type="journal"><name><surname>Lemey</surname><given-names>P</given-names></name>, <name><surname>Hong</surname><given-names>SL</given-names></name>, <name><surname>Hill</surname><given-names>V</given-names></name>, <name><surname>Baele</surname><given-names>G</given-names></name>, <name><surname>Poletto</surname><given-names>C</given-names></name>, <name><surname>Colizza</surname><given-names>V</given-names></name>, <name><surname>O&#x02019;Toole</surname><given-names>&#x000c1;</given-names></name>, <name><surname>McCrone</surname><given-names>JT</given-names></name>, <name><surname>Andersen</surname><given-names>KG</given-names></name>, <name><surname>Worobey</surname><given-names>M</given-names></name>, <etal/> (<year>2020</year>). <article-title>Accommodating individual travel history and unsampled diversity in Bayesian phylogeographic inference of SARS-CoV-2</article-title>. <source>Nat. Commun</source>. <volume>11</volume>, <fpage>1</fpage>&#x02013;<lpage>14</lpage>.<pub-id pub-id-type="pmid">31911652</pub-id></mixed-citation></ref><ref id="R46"><label>46.</label><mixed-citation publication-type="journal"><name><surname>Rambaut</surname><given-names>A</given-names></name>, <name><surname>Drummond</surname><given-names>AJ</given-names></name>, <name><surname>Xie</surname><given-names>D</given-names></name>, <name><surname>Baele</surname><given-names>G</given-names></name>, and <name><surname>Suchard</surname><given-names>MA</given-names></name> (<year>2018</year>). <article-title>Posterior Summarization in Bayesian Phylogenetics Using Tracer 1.7</article-title>. <source>Syst. Biol</source>. <volume>67</volume>, <fpage>901</fpage>&#x02013;<lpage>904</lpage>.<pub-id pub-id-type="pmid">29718447</pub-id></mixed-citation></ref><ref id="R47"><label>47.</label><mixed-citation publication-type="journal"><name><surname>Yu</surname><given-names>G-Y</given-names></name>, <name><surname>Wiley</surname><given-names>MR</given-names></name>, <name><surname>Kugelman</surname><given-names>JR</given-names></name>, <name><surname>Ladner</surname><given-names>JT</given-names></name>, <name><surname>Beitzel</surname><given-names>BF</given-names></name>, <name><surname>Eccleston</surname><given-names>LT</given-names></name>, <name><surname>Morazzani</surname><given-names>EM</given-names></name>, <name><surname>Glass</surname><given-names>PJ</given-names></name>, and <name><surname>Palacios</surname><given-names>GF</given-names></name> (<year>2015</year>). <article-title>Complete Coding Sequences of Eastern Equine Encephalitis Virus and Venezuelan Equine Encephalitis Virus Strains Isolated from Human Cases</article-title>. <source>Genome Announc</source>. <volume>3</volume>. <pub-id pub-id-type="doi">10.1128/genomeA.00243-15</pub-id>.</mixed-citation></ref><ref id="R48"><label>48.</label><mixed-citation publication-type="journal"><name><surname>Cameron</surname><given-names>AC</given-names></name>, and <name><surname>Trivedi</surname><given-names>PK</given-names></name> (<year>1990</year>). <article-title>Regression-based tests for overdispersion in the Poisson model</article-title>. <source>J. Econom</source>. <volume>46</volume>, <fpage>347</fpage>&#x02013;<lpage>364</lpage>.</mixed-citation></ref><ref id="R49"><label>49.</label><mixed-citation publication-type="journal"><name><surname>Corrin</surname><given-names>T</given-names></name>, <name><surname>Ackford</surname><given-names>R</given-names></name>, <name><surname>Mascarenhas</surname><given-names>M</given-names></name>, <name><surname>Greig</surname><given-names>J</given-names></name>, and <name><surname>Waddell</surname><given-names>LA</given-names></name> (<year>2021</year>). <article-title>Eastern Equine Encephalitis Virus: A Scoping Review of the Global Evidence</article-title>. <source>Vector Borne Zoonotic Dis</source>. <volume>21</volume>, <fpage>305</fpage>&#x02013;<lpage>320</lpage>.<pub-id pub-id-type="pmid">33332203</pub-id></mixed-citation></ref><ref id="R50"><label>50.</label><mixed-citation publication-type="journal"><name><surname>Stobierski</surname><given-names>MG</given-names></name>, <name><surname>Signs</surname><given-names>K</given-names></name>, <name><surname>Dinh</surname><given-names>E</given-names></name>, <name><surname>Cooley</surname><given-names>TM</given-names></name>, <name><surname>Melotti</surname><given-names>J</given-names></name>, <name><surname>Schalow</surname><given-names>M</given-names></name>, <name><surname>Patterson</surname><given-names>JS</given-names></name>, <name><surname>Bolin</surname><given-names>SR</given-names></name>, and <name><surname>Walker</surname><given-names>ED</given-names></name> (<year>2022</year>). <article-title>Eastern Equine Encephalomyelitis in Michigan: Historical Review of Equine, Human, and Wildlife Involvement, Epidemiology, Vector Associations, and Factors Contributing to Endemicity</article-title>. <source>J. Med. Entomol</source>. <volume>59</volume>, <fpage>27</fpage>&#x02013;<lpage>40</lpage>.<pub-id pub-id-type="pmid">34734638</pub-id></mixed-citation></ref><ref id="R51"><label>51.</label><mixed-citation publication-type="journal"><name><surname>Grady</surname><given-names>GF</given-names></name>, <name><surname>Maxfield</surname><given-names>HK</given-names></name>, <name><surname>Hildreth</surname><given-names>SW</given-names></name>, <name><surname>Timperi</surname><given-names>RJ</given-names><suffix>Jr</suffix></name>, <name><surname>Gilfillan</surname><given-names>RF</given-names></name>, <name><surname>Rosenau</surname><given-names>BJ</given-names></name>, <name><surname>Francy</surname><given-names>DB</given-names></name>, <name><surname>Calisher</surname><given-names>CH</given-names></name>, <name><surname>Marcus</surname><given-names>LC</given-names></name>, and <name><surname>Madoff</surname><given-names>MA</given-names></name> (<year>1978</year>). <article-title>Eastern equine encephalitis in Massachusetts, 1957&#x02013;1976. A prospective study centered upon analyses of mosquitoes</article-title>. <source>Am. J. Epidemiol</source>. <volume>107</volume>, <fpage>170</fpage>&#x02013;<lpage>178</lpage>.<pub-id pub-id-type="pmid">23676</pub-id></mixed-citation></ref><ref id="R52"><label>52.</label><mixed-citation publication-type="journal"><name><surname>Feemster</surname><given-names>RF</given-names></name> (<year>1938</year>). <article-title>Outbreak of Encephalitis in Man Due to the Eastern Virus of Equine Encephalomyelitis</article-title>. <source>Am. J. Public Health Nations. Health</source>
<volume>28</volume>, <fpage>1403</fpage>&#x02013;<lpage>1410</lpage>.<pub-id pub-id-type="pmid">18014957</pub-id></mixed-citation></ref><ref id="R53"><label>53.</label><mixed-citation publication-type="webpage"><collab>Massachusetts Department of Public Health</collab> (<year>2022</year>). <source>Arbovirus Surveillance Plan and historical data</source>. <comment><ext-link xlink:href="https://www.mass.gov/lists/arbovirus-surveillance-plan-and-historical-data" ext-link-type="uri">https://www.mass.gov/lists/arbovirus-surveillance-plan-and-historical-data</ext-link></comment>.</mixed-citation></ref><ref id="R54"><label>54.</label><mixed-citation publication-type="journal"><name><surname>Celis-Murillo</surname><given-names>A</given-names></name>, <name><surname>Malorodova</surname><given-names>M</given-names></name>, and <name><surname>Nakash</surname><given-names>E</given-names></name> (<year>2022</year>). <source>North American Bird Banding Program Dataset 1960&#x02013;2022 retrieved 2022&#x02013;07-14</source>. <pub-id pub-id-type="doi">10.5066/P9BSM38F</pub-id>.</mixed-citation></ref></ref-list></back><floats-group><fig position="float" id="F1"><label>Figure 1 |</label><caption><title>Temporal and geographical characteristics of previous EEEV outbreaks after 2000 and context of the 2019 outbreak in Massachusetts, Connecticut, and New York.</title><p id="P88">A) Human and horse cases per year since 2000 in Massachusetts, Connecticut, and New York, colored by state. B) Human and veterinary cases in 2019 in these three states by sample date. Note that human cases are only available to the nearest month whereas veterinary cases have specific dates. C) Map showing geographical distribution of human and horse cases in 2019, shown as stars, relative to EEEV detections after 2000 in Massachusetts, Connecticut, and New York. Brown denotes counties where mosquito-positive pools have been sampled, hatched are non-human cases, and circles are human cases. D) EEEV infection rate of Culiseta melanura mosquitoes and the number tested in Massachusetts, Connecticut, and New York by year from 2000. Also see <xref rid="SD1" ref-type="supplementary-material">Figure S2</xref>.</p></caption><graphic xlink:href="nihms-1907424-f0001" position="float"/></fig><fig position="float" id="F2"><label>Figure 2 |</label><caption><title>Phylogeographic reconstruction of EEEV from 2019 and prior outbreaks</title><p id="P89">A) Number of EEEV sequences in the dataset over time by year of sampling. Note that the nationwide reporting of surveillance data began in 2003. B) Location of EEEV sequences in the dataset from Massachusetts, New York, and Connecticut to the county level. Stars indicate the location of EEEV samples which were newly sequenced for this study. C) Location of all EEEV sequences in the study to state level. D) Time-resolved phylogeny colored by location of nodes from the discrete phylogeographic analysis. States in the Northeast are colored separately, but non-Northeast and non-Florida states are grouped together. Larger tips represent EEEV sequences from 2019. E) Movement of virus from the full posterior of the discrete phylogeographic analysis. Direction is counterclockwise, and width of lines corresponds to frequency of movement across the posterior. Movements that make up fewer than 1% of the total posterior have been filtered out. Also see <xref rid="SD1" ref-type="supplementary-material">Figure S1</xref> and <xref rid="SD2" ref-type="supplementary-material">Table S1</xref>.</p></caption><graphic xlink:href="nihms-1907424-f0002" position="float"/></fig><fig position="float" id="F3"><label>Figure 3 |</label><caption><title>Detection and persistence of EEEV lineages in the Northeast</title><p id="P90">A) Time-scaled phylogeny estimating EEEV introductions into the Northeast, taking sporadic sampling into account by splitting up clusters with very long internal branches (see Methods). B) Distributions of time from introduction to first (top) and last sample (bottom) for Northeastern clusters of more than three EEEV sequences. C) Time of first node in the Northeast, first sample, and last sample for each cluster with more than three EEEV sequences, colored by state.</p></caption><graphic xlink:href="nihms-1907424-f0003" position="float"/></fig><fig position="float" id="F4"><label>Figure 4 |</label><caption><title>Phylogeographic spread of EEEV within the Northeast</title><p id="P91">A) Between-state movements from the maximum clade credibility (MCC) tree of the phylogeographic analysis within the six Northeastern EEEV clusters which have between-state movement. Width of lines relates to the number of movements, and direction is counter-clockwise. B) Maps showing sampling location to the county level for each EEEV cluster with multiple states where available. Stars indicate where there are sequences with information only at the state level (n=2 in New Hampshire, n=1 in Massachusetts and n=3 in Vermont). Corresponding subtrees are shown to the right of each map, colored by inferred location to the state level.</p></caption><graphic xlink:href="nihms-1907424-f0004" position="float"/></fig><fig position="float" id="F5"><label>Figure 5 |</label><caption><title>Model predictions of EEEV cases using mosquito infection estimates</title><p id="P92">A) Poisson regression by state of the number of EEEV positive Cs. melanura pools sampled and human and horse cases. B) Monthly trends across the year of mosquito abundance (Cs. melanura collected per trap per day), infection rate (MLE per 1000 Cs. melanura), vector index (abundance multiplied by the infection rate) and index P (modeled estimate of reproduction number), for Connecticut and Massachusetts. 2019 values are highlighted in red. C) Results of a negative binomial regression model for both Connecticut and Massachusetts combined of case risk predicted by vector index, first month of EEEV detection, index P with a 1 month lag, year, and risk compared to the month of May-July of cases in August, September, and October. The covariate for state was removed for scale, as its estimate is 11.95 (95% CI: 3.88 to 43.70) with Connecticut being the reference group. D) Actual and predicted case counts for each year based on the modeled results presented in C. Shaded areas denote error in the predicted values. E) Simulations using the previously described model. Predicted cases and intervals utilized a range of plausible vector index values and whether EEEV was detected in July or not, with index P held constant using the average value derived from the years studied for each month; and split by state. Shaded areas represent 95% confidence intervals and points are real data points from the EEEV mosquito surveillance program discussed elsewhere. Stars indicate values from 2019 and darker points indicate the actual modeled value of Index P. This model underpredicts cases when the vector index is low, as the real data points fall outside of the prediction intervals, indicating a potential lag in identification of EEEV cases. This could be due in part to stochastic chance in surveillance programs missing EEEV with low levels of virus circulation. As the vector index increases, however, our predicted values become closer to the observed data points. See also <xref rid="SD1" ref-type="supplementary-material">figures S3</xref>, <xref rid="SD1" ref-type="supplementary-material">S4</xref>, and <xref rid="SD1" ref-type="supplementary-material">S5</xref>, and <xref rid="SD1" ref-type="supplementary-material">tables S2</xref>, <xref rid="SD1" ref-type="supplementary-material">S3</xref> and <xref rid="SD1" ref-type="supplementary-material">S4</xref>.</p></caption><graphic xlink:href="nihms-1907424-f0005" position="float"/></fig><table-wrap position="float" id="T1"><table frame="box" rules="all"><colgroup span="1"><col align="left" valign="middle" span="1"/><col align="left" valign="middle" span="1"/><col align="left" valign="middle" span="1"/></colgroup><thead><tr><th align="left" valign="top" rowspan="1" colspan="1">REAGENT or RESOURCE</th><th align="left" valign="top" rowspan="1" colspan="1">SOURCE</th><th align="left" valign="top" rowspan="1" colspan="1">IDENTIFIER</th></tr></thead><tbody><tr><td colspan="3" align="left" valign="top" rowspan="1">Biological Samples</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Mosquito pools</td><td align="left" valign="top" rowspan="1" colspan="1">NYDPH, MADPH, CT agricultural research station</td><td align="left" valign="top" rowspan="1" colspan="1">N/A</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Clinical and veterinary samples</td><td align="left" valign="top" rowspan="1" colspan="1">NYDPH, MADPH, CT agricultural research station</td><td align="left" valign="top" rowspan="1" colspan="1">N/A</td></tr><tr><td colspan="3" align="left" valign="top" rowspan="1">Critical Commercial Assays</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">TaqMan<sup>&#x02122;</sup> RNA-to-C<sub>T</sub><sup>&#x02122;</sup> 1-Step Kit</td><td align="left" valign="top" rowspan="1" colspan="1">ThermoFisher Scientific</td><td align="left" valign="top" rowspan="1" colspan="1">Catalog #4392938</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Magmax Viral isolation kit</td><td align="left" valign="top" rowspan="1" colspan="1">ThermoFisher Scientific</td><td align="left" valign="top" rowspan="1" colspan="1">Catalog #A42352</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Superscript III RT-PCR with Platinum Ta1</td><td align="left" valign="top" rowspan="1" colspan="1">ThermoFisher Scientific</td><td align="left" valign="top" rowspan="1" colspan="1">Catalog #12574018</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Zymo DNA Clean and Concentrate</td><td align="left" valign="top" rowspan="1" colspan="1">Zymo Research</td><td align="left" valign="top" rowspan="1" colspan="1">Catalog #D4005</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Nextera XT kit</td><td align="left" valign="top" rowspan="1" colspan="1">Illumina</td><td align="left" valign="top" rowspan="1" colspan="1">Catalog #FC-131-1024</td></tr><tr><td colspan="3" align="left" valign="top" rowspan="1">Deposited Data</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Visual Crossing</td><td align="left" valign="top" rowspan="1" colspan="1"/><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.visualcrossing.com" ext-link-type="uri">https://www.visualcrossing.com</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">ArboNET</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.cdc.gov/mosquitoes/mosquito-control/professionals/ArboNET.html" ext-link-type="uri">https://www.cdc.gov/mosquitoes/mosquito-control/professionals/ArboNET.html</ext-link>
</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://wwwn.cdc.gov/arbonet/maps/ADB_Diseases_Map/index.html" ext-link-type="uri">https://wwwn.cdc.gov/arbonet/maps/ADB_Diseases_Map/index.html</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">North American Bird Banding Program</td><td align="left" valign="top" rowspan="1" colspan="1">Celis-Murillo, A., Malorodova, M., and Nakash, E., 2022, North American Bird Banding Program Dataset 1960&#x02013;2022 retrieved 2022-07-14: U.S. Geological Survey data release, <ext-link xlink:href="10.5066/P9BSM38F" ext-link-type="doi">https://doi.org/10.5066/P9BSM38F</ext-link>.</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.sciencebase.gov/catalog/item/632b2d7bd34e71c6d67bc161" ext-link-type="uri">https://www.sciencebase.gov/catalog/item/632b2d7bd34e71c6d67bc161</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Pre-existing EEEV sequencing data</td><td align="left" valign="top" rowspan="1" colspan="1">Genbank</td><td align="left" valign="top" rowspan="1" colspan="1">See <xref rid="SD1" ref-type="supplementary-material">Table S6</xref></td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Newly generated EEEV sequencing data</td><td align="left" valign="top" rowspan="1" colspan="1">Genbank</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA937726" ext-link-type="uri">https://www.ncbi.nlm.nih.gov/bioproject/PRJNA937726</ext-link>
</td></tr><tr><td colspan="3" align="left" valign="top" rowspan="1">Oligonucleotides</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">EEEV RT-PCR assay</td><td align="left" valign="top" rowspan="1" colspan="1">NYDPH</td><td align="left" valign="top" rowspan="1" colspan="1">CCCTAGTTCGATGTACTTCCG, FAM-CCGCCGATGCAGTG, GCATTATGCACTGCCCTTAGATGAAGAGCGCAGAAGACCCCY5-CAGACTCTACCGCTACGCAGACAAGGCGTCGACATTACTGTTAGC From Zink <italic toggle="yes">et al</italic><sup><xref rid="R31" ref-type="bibr">31</xref></sup></td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">EEEV primers</td><td align="left" valign="top" rowspan="1" colspan="1"/><td align="left" valign="top" rowspan="1" colspan="1">See <xref rid="SD1" ref-type="supplementary-material">Table S5</xref></td></tr><tr><td colspan="3" align="left" valign="top" rowspan="1">Software and Algorithms</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Geneious Prime version 2022.2.2.</td><td align="left" valign="top" rowspan="1" colspan="1">Dotmatics</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.geneious.com/" ext-link-type="uri">https://www.geneious.com/</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Mafft v 1.3.7</td><td align="left" valign="top" rowspan="1" colspan="1">Katoh <italic toggle="yes">et al</italic><sup><xref rid="R37" ref-type="bibr">37</xref></sup></td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://mafft.cbrc.jp/alignment/software/" ext-link-type="uri">https://mafft.cbrc.jp/alignment/software/</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">BEAST v1.10</td><td align="left" valign="top" rowspan="1" colspan="1">Suchard <italic toggle="yes">et al</italic><sup><xref rid="R41" ref-type="bibr">41</xref></sup></td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://beast.community/" ext-link-type="uri">https://beast.community/</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">R v4.1.2</td><td align="left" valign="top" rowspan="1" colspan="1">The R Foundation for Statistical Computing</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="http://www.R-project.org/" ext-link-type="uri">http://www.R-project.org</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">R packages (DHARMa v0.4.6, easystats, MASS, PooledInfRate v1.4)</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://cran.R-project.org/package=DHARMa" ext-link-type="uri">https://CRAN.R-project.org/package=DHARMa</ext-link>
<break/>
<ext-link xlink:href="https://easystats.github.io/easystats/" ext-link-type="uri">https://easystats.github.io/easystats/</ext-link>
<break/>
<ext-link xlink:href="https://github.com/CDCgov/PooledInfRate" ext-link-type="uri">https://github.com/CDCgov/PooledInfRate</ext-link>
</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="http://www.R-project.org/" ext-link-type="uri">http://www.R-project.org</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">IQTree v2.1.4</td><td align="left" valign="top" rowspan="1" colspan="1">Minh <italic toggle="yes">et al</italic>
<sup><xref rid="R38" ref-type="bibr">38</xref></sup></td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="http://www.iqtree.org/" ext-link-type="uri">http://www.iqtree.org/</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">Python v3.9</td><td align="left" valign="top" rowspan="1" colspan="1"/><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.python.org/" ext-link-type="uri">https://www.python.org/</ext-link>
</td></tr><tr><td align="left" valign="top" rowspan="1" colspan="1">DNA Lasergene v13.0</td><td align="left" valign="top" rowspan="1" colspan="1">DNA Star</td><td align="left" valign="top" rowspan="1" colspan="1">
<ext-link xlink:href="https://www.dnastar.com/software/lasergene/" ext-link-type="uri">https://www.dnastar.com/software/lasergene/</ext-link>
</td></tr></tbody></table></table-wrap><boxed-text id="BX1" position="float"><caption><title>Highlights:</title></caption><list list-type="bullet" id="L2"><list-item><p id="P93">Genomic sequencing from a large outbreak of EEEVin the northeast US in 2019</p></list-item><list-item><p id="P94">Outbreak caused by several independent short-lived virus introductions from Florida</p></list-item><list-item><p id="P95">Mosquito abundance and infection rate are predictive of human and horse cases</p></list-item><list-item><p id="P96">High-quality mosquito surveillance is vital for controlling outbreaks</p></list-item></list></boxed-text></floats-group></article>