<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">IJMR</journal-id>
      <journal-id journal-id-type="nlm-ta">Interact J Med Res</journal-id>
      <journal-title>Interactive Journal of Medical Research</journal-title>
      <issn pub-type="epub">1929-073X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v12i1e42292</article-id>
      <article-id pub-id-type="pmid">36913554</article-id>
      <article-id pub-id-type="doi">10.2196/42292</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Big Data and Infectious Disease Epidemiology: Bibliometric Analysis and Research Agenda</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wang</surname>
            <given-names>Zhongqing</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Berchialla</surname>
            <given-names>Paola</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Amusa</surname>
            <given-names>Lateef Babatunde</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Centre for Applied Data Science</institution>
            <institution>University of Johannesburg</institution>
            <addr-line>Bunting Road Campus, Auckland Park</addr-line>
            <addr-line>Johannesburg, 2006</addr-line>
            <country>South Africa</country>
            <phone>27 659904686</phone>
            <email>amusasuxes@gmail.com</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8848-1149</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Twinomurinzi</surname>
            <given-names>Hossana</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9811-3358</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Phalane</surname>
            <given-names>Edith</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6128-2337</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Phaswana-Mafuya</surname>
            <given-names>Refilwe Nancy</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9387-0432</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Centre for Applied Data Science</institution>
        <institution>University of Johannesburg</institution>
        <addr-line>Johannesburg</addr-line>
        <country>South Africa</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Statistics</institution>
        <institution>University of Ilorin</institution>
        <addr-line>Ilorin</addr-line>
        <country>Nigeria</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Pan African Centre for Epidemics Research (PACER) Extramural Unit</institution>
        <institution>South African Medical Research Council/University of Johannesburg</institution>
        <addr-line>Johannesburg</addr-line>
        <country>South Africa</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Environmental Health</institution>
        <institution>Faculty of Health Sciences</institution>
        <institution>University of Johannesburg</institution>
        <addr-line>Johannesburg</addr-line>
        <country>South Africa</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Lateef Babatunde Amusa <email>amusasuxes@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>31</day>
        <month>3</month>
        <year>2023</year>
      </pub-date>
      <volume>12</volume>
      <elocation-id>e42292</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>8</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>10</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>21</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>11</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Lateef Babatunde Amusa, Hossana Twinomurinzi, Edith Phalane, Refilwe Nancy Phaswana-Mafuya. Originally published in the Interactive Journal of Medical Research (https://www.i-jmr.org/), 31.03.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Interactive Journal of Medical Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.i-jmr.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.i-jmr.org/2023/1/e42292" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Infectious diseases represent a major challenge for health systems worldwide. With the recent global pandemic of COVID-19, the need to research strategies to treat these health problems has become even more pressing. Although the literature on big data and data science in health has grown rapidly, few studies have synthesized these individual studies, and none has identified the utility of big data in infectious disease surveillance and modeling.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to synthesize research and identify hotspots of big data in infectious disease epidemiology.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Bibliometric data from 3054 documents that satisfied the inclusion criteria retrieved from the Web of Science database over 22 years (2000-2022) were analyzed and reviewed. The search retrieval occurred on October 17, 2022. Bibliometric analysis was performed to illustrate the relationships between research constituents, topics, and key terms in the retrieved documents.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The bibliometric analysis revealed internet searches and social media as the most utilized big data sources for infectious disease surveillance or modeling. The analysis also placed US and Chinese institutions as leaders in this research area. Disease monitoring and surveillance, utility of electronic health (or medical) records, methodology framework for infodemiology tools, and machine/deep learning were identified as the core research themes.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Proposals for future studies are made based on these findings. This study will provide health care informatics scholars with a comprehensive understanding of big data research in infectious disease epidemiology.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>big data</kwd>
        <kwd>bibliometrics</kwd>
        <kwd>infectious disease</kwd>
        <kwd>COVID-19</kwd>
        <kwd>disease surveillance</kwd>
        <kwd>disease</kwd>
        <kwd>pandemic</kwd>
        <kwd>data</kwd>
        <kwd>surveillance</kwd>
        <kwd>hotspot</kwd>
        <kwd>epidemiology</kwd>
        <kwd>social media</kwd>
        <kwd>utility</kwd>
        <kwd>electronic health records</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Globally, the infectious disease burden continues to be substantial in countries with low and lower-middle income, while morbidity and mortality related to neglected tropical diseases and HIV infection, tuberculosis, and malaria remain high. Tuberculosis and malaria are endemic to many areas, imposing substantial but steady burdens. At the same time, other infections such as influenza fluctuate in pervasiveness and intensity, disrupting the developing and developed settings alike when an outbreak and epidemic occurs. Additionally, deaths have persisted over the 21st century due to emerging and reemerging infectious diseases compared with seasonal and endemic infections. This portrays a new era of infectious disease, defined by outbreaks of emerging, reemerging, and endemic pathogens that spread quickly with the help of global mobility and climate change [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
      <p>Moreover, the risk from infectious diseases is globally shared. While infectious diseases thrive in underresourced settings, inequalities and inequities in accessing health and health care create a favorable environment for infectious diseases to spread [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Addressing inequalities and inequities in accessing health care, and improving surveillance and monitoring of infectious diseases should be prioritized to minimize the emergence and spread of infections.</p>
      <p>Recent years have witnessed the rapid emergence of big data and data science research, propelled by the increasing availability of digital traces [<xref ref-type="bibr" rid="ref4">4</xref>]. The growing availability of electronic records and passive data generated by social media, the internet, and other digital sources can be mined for pattern discoveries and knowledge extraction. Like most buzz words, <italic>big data</italic> has no straightforward meaning and its definition is evolving. Broadly, big data refers to a large volume of structured or unstructured data, with <italic>largeness</italic> itself associated with three major terms known as the “3 Vs”: volume (large quantity), velocity (coming in at unprecedented real-time speeds), and variety (increasing collection from different data sources). Additional characteristics of big data include veracity, validity, volatility, and value [<xref ref-type="bibr" rid="ref5">5</xref>]. For epidemiology and infectious diseases research, this means that in the last decade, there has been a significant spike in the number of studies with considerable interest in using digital epidemiology and big data tools to enhance health systems in terms of disease surveillance, modeling, and evidence-based responses [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Digital epidemiology uses digital data or online sources to gain insight into disease dynamics and health equity, and to inform public health programs and policies [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>The success of infectious disease control relies heavily on surveillance systems tracking diseases, pathogens, and clinical outcomes [<xref ref-type="bibr" rid="ref11">11</xref>]. However, conventional surveillance systems are known to frequently have severe time lags and limited spatial resolution; therefore, surveillance systems that are robust, local, and timely are critically needed. It is crucial to monitor and forecast emerging and reemerging infections [<xref ref-type="bibr" rid="ref12">12</xref>] such as severe acute respiratory syndrome, pandemic influenza, Ebola, Zika, and drug-resistant pathogens, especially in resource-limited settings such as low-middle–income countries. Using big data to strengthen surveillance systems is critical for future pandemic preparedness. This approach provides big data streams that can be triangulated with spatial and temporal data. These big data streams include digital data sources such as mobile health apps, electronic health (or medical) records, social media, internet searches, mobile phone network data, and GPS mobile data. Many studies have demonstrated the usefulness of real-time data in health assessments [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. Some of these studies have been used explicitly for the monitoring and forecasting of epidemics such as COVID-19 [<xref ref-type="bibr" rid="ref19">19</xref>], Zika [<xref ref-type="bibr" rid="ref13">13</xref>], Ebola [<xref ref-type="bibr" rid="ref16">16</xref>], and influenza [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      <p>The body of extant literature at the nexus of big data, epidemiology, and infectious diseases is rapidly growing. However, despite its growth and dispersion, there has been a limited synthesis of the applications. A previous study [<xref ref-type="bibr" rid="ref20">20</xref>] performed a bibliometric analysis focusing on only HIV. A bibliometric analysis is a statistical or quantitative analysis of large-scale bibliographic metadata (or metrics of published studies) on a given topic. These quantitative analyses detect patterns, networks, and trends among the bibliographic metadata [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Thus, the aim of this study was to address the evolution of big data in epidemiology and infectious diseases to identify gaps and opportunities for further research. The study findings reveal interesting patterns and can inform trending research focus and future directions in big data–driven infectious diseases research.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>A bibliometric analysis was performed to understand and explore research on big data in infectious disease modeling and surveillance. The adopted bibliometric methodology involved three main phases: data collection, data analysis, and data visualization and reporting [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      </sec>
      <sec>
        <title>Search Strategy</title>
        <p>Regarding data collection, which entails querying and exporting data from selected databases, we queried the Web of Science (WoS) core databases for publications using specific inclusion and exclusion criteria. Compared to other databases, the WoS has been shown to have better quality bibliometric information [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] and more excellent coverage of high-impact journals [<xref ref-type="bibr" rid="ref25">25</xref>]. With the aid of domain knowledge experts from the fields of both big data and epidemiology, we iteratively developed a search strategy and selected the following search terms. The following search string queried all documents’ titles, abstracts, and keywords, and generated 3235 publications in the WoS collection:</p>
        <disp-quote>
          <p>(Epidemic* OR “infectious disease*” OR “Disease surveillance” OR “disease transmission” OR “disease outbreak*” OR (“communicable disease*” NOT “non-communicable disease”) OR syndemic* OR HIV OR AIDS OR “human immunodeficiency virus” OR coronavirus* OR SARS-CoV-2 OR COVID-19 OR Influenza OR flu OR Zika OR Ebola OR MERS OR “Middle East respiratory syndrome” OR Tuberculosis OR “Monkey Pox” OR “Dengue virus” OR Hepatitis*)</p>
        </disp-quote>
        <p>
          <italic>AND</italic>
        </p>
        <disp-quote>
          <p>(“BIG DATA” OR “web mining” OR “opinion mining” OR “Google Trend*” OR “Google search*” OR “Google quer*” OR “Internet search*” OR “Internet quer*” OR “search engine quer*” OR “Digital traces” OR “electronic health records” OR “Digital epidemiology”)</p>
        </disp-quote>
      </sec>
      <sec>
        <title>Screening Strategy</title>
        <p>Documents not written in English and not peer-reviewed, including editorial materials, letters, meeting abstracts, news items, book reviews, and retracted publications, were removed from the data set given the focus on bibliometric analysis, leaving 3054 documents for the analytic sample (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow chart of the literature selection process.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Analysis</title>
        <p>The 3054 bibliographic data were exported into the R package <italic>bibliometrix</italic> [<xref ref-type="bibr" rid="ref23">23</xref>] for analysis. This package was specifically used to conduct performance analysis and science mapping of big data in infectious disease epidemiology. Performance mapping evaluates the production and impact of research constituents, including authors, institutions, countries, and journals. Science mapping examines the relationships between the research constituents by analyzing the topic’s conceptual, intellectual, and social structure.</p>
        <p>There are several metrics available for bibliometric analysis. In this study, the primary metrics used for evaluating productivity and influence were the H-index and M-index. The H-index represents the number of published papers <italic>h</italic>, such that the citation number is at least <italic>h</italic> [<xref ref-type="bibr" rid="ref26">26</xref>]. The H-index can be computed for different bibliometric units of analysis: authors, journals, institutions, and countries. The M-index simply adjusts the H-index for the academic age (ie, the number of years since the researcher’s first publication). Other utilized performance analysis metrics were obtained from yearly research output and citation counts. These metrics also contribute to identifying the main themes and the key actors in the research area.</p>
        <p>In terms of science mapping, network maps were constructed for some selected bibliographic units of analysis [<xref ref-type="bibr" rid="ref27">27</xref>]. These networks exhibit frequency distributions of the involved bibliographic data over time. For instance, international collaborations can be explored by assessing same-country publications. A cocitation network analysis was also used to analyze publication references. In addition, using the Louvain clustering algorithm and a greedy optimization technique [<xref ref-type="bibr" rid="ref28">28</xref>], a co-occurrence analysis was used to understand the conceptual structure of the research area. The basic purpose of co-occurrence analysis is to investigate the link between keywords based on the number of times they appear together in a publication. Notable research topics and over-time trends were detected by generating clusters for author-provided keywords [<xref ref-type="bibr" rid="ref29">29</xref>]. VOSviewer [<xref ref-type="bibr" rid="ref30">30</xref>] was used to construct the network visualizations. Each network node represents a research constituent (eg, author, country, institution, article, document source, keyword). The node’s size is proportional to the occurrence frequency of the relevant parameters. The degree of association is represented by the thickness of the link between nodes, and the various colors reflect distinct clusters.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Descriptive Summary</title>
        <p>The bibliographic data set comprises 3054 documents from 1600 sources, 14,351 authors, and 121,726 references. From the 3054 documents, 2666 (87.30%) were original research articles and the remaining 388 (12.70%) were review papers. The research output before 2009 was relatively low. The annual publication output during the 27 years (1995-2022) grew steadily, with a yearly growth rate of 26.5%. The publication growth increased steeply between 2013 and 2020 (<xref rid="figure2" ref-type="fig">Figure 2</xref>). <xref ref-type="table" rid="table1">Table 1</xref> presents the summary statistics of the primary characteristics of these 3054 publications, including the time span and information about documents and authors.</p>
        <p>As shown in <xref ref-type="table" rid="table2">Table 2</xref>, the most productive and influential sources publishing on topics related to big data and infectious diseases epidemiology were <italic>Journal of Medical Internet Research</italic> and <italic>PLoS One</italic> (H-index=18), followed by <italic>IEEE Access</italic> (H-index=13). In terms of productivity, <italic>Journal of Medical Internet Research</italic> produced a slightly higher number of publications (n=61) than the next best journal <italic>PLoS One</italic> (n=56). <italic>PLoS One</italic> had the highest number of total citations at 1893.</p>
        <p>As shown in <xref ref-type="table" rid="table3">Table 3</xref>, the most productive and influential author was Zhang Y (H-index=17), followed by Li X (H-index=13) and Wang J (H-index=12). Wang L had the highest total citations (n=1072), which was substantially higher than the next most impactful author Wang J (total citations=861).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Annual growth of publications related to big data in infectious diseases research.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Main descriptive summary of the extracted bibliographic records from 1995 to 2022.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="630"/>
            <col width="340"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Description</td>
                <td>Results</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Time span (years)</td>
                <td>1995-2022</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Sources, n</td>
                <td>1600</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Documents, n</td>
                <td>3054</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Annual growth rate, %</td>
                <td>26.52</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Document average age (years)</td>
                <td>2.86</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Average citations per document, n</td>
                <td>18.52</td>
              </tr>
              <tr valign="top">
                <td colspan="2">References, n</td>
                <td>121,726</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Authors, n</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Total</td>
                <td>14,351</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single-authored documents</td>
                <td>225</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Author collaborations</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single-authored documents, n</td>
                <td>236</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Coauthors per document, n</td>
                <td>5.55</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>International coauthorships, %</td>
                <td>28.04</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Top 10 productive and influential publication sources ranked by H-index.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="330"/>
            <col width="70"/>
            <col width="80"/>
            <col width="130"/>
            <col width="120"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Journal</td>
                <td>Aim and scope</td>
                <td>H-index</td>
                <td>M-index</td>
                <td>Total citations, n</td>
                <td>Publications, n</td>
                <td>Publication year</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Journal of Medical Internet Research</td>
                <td>Digital health, data science, health informatics, and emerging technologies for health, medicine, and biomedical research</td>
                <td>18</td>
                <td>1.13</td>
                <td>1705</td>
                <td>61</td>
                <td>2007</td>
              </tr>
              <tr valign="top">
                <td>PLoS One</td>
                <td>Multidisciplinary</td>
                <td>18</td>
                <td>1.39</td>
                <td>1893</td>
                <td>56</td>
                <td>2010</td>
              </tr>
              <tr valign="top">
                <td>IEEE Access</td>
                <td>Multidisciplinary, comprising all IEEE fields of interest, emphasizing applications-oriented and interdisciplinary articles</td>
                <td>13</td>
                <td>1.63</td>
                <td>983</td>
                <td>32</td>
                <td>2015</td>
              </tr>
              <tr valign="top">
                <td>Scientific Reports</td>
                <td>Publishes from all areas of the natural sciences, psychology, medicine, and engineering</td>
                <td>13</td>
                <td>1.63</td>
                <td>389</td>
                <td>23</td>
                <td>2015</td>
              </tr>
              <tr valign="top">
                <td>Journal of the American Medical Informatics Association</td>
                <td>Biomedical and health informatics, including clinical care, clinical research, translational science, implementation science, imaging, education, consumer health, public health, and policy</td>
                <td>12</td>
                <td>0.86</td>
                <td>569</td>
                <td>33</td>
                <td>2009</td>
              </tr>
              <tr valign="top">
                <td>BMJ Open</td>
                <td>Medical journal considering papers in clinical medicine, public health, and epidemiology</td>
                <td>11</td>
                <td>1.10</td>
                <td>310</td>
                <td>32</td>
                <td>2013</td>
              </tr>
              <tr valign="top">
                <td>JMIR Public Health &#38; Surveillance</td>
                <td>Multidisciplinary journal with a unique focus on the intersection of innovation and technology in public health</td>
                <td>11</td>
                <td>2.20</td>
                <td>724</td>
                <td>23</td>
                <td>2018</td>
              </tr>
              <tr valign="top">
                <td>International Journal of Medical Informatics</td>
                <td>Medical informatics, including information systems and computer-aided medical support decision systems</td>
                <td>11</td>
                <td>0.65</td>
                <td>450</td>
                <td>16</td>
                <td>2006</td>
              </tr>
              <tr valign="top">
                <td>International Journal of Infectious Diseases</td>
                <td>Original clinical and laboratory-based research, together with reports of clinical trials, reviews, and some case reports dealing with the epidemiology, clinical diagnosis, treatment, and control of infectious diseases</td>
                <td>10</td>
                <td>0.91</td>
                <td>530</td>
                <td>17</td>
                <td>2012</td>
              </tr>
              <tr valign="top">
                <td>BMC Medical Informatics &#38; Decision Making</td>
                <td>Relating to the design, development, implementation, and evaluation of health information technologies and decision-making for human health</td>
                <td>10</td>
                <td>0.91</td>
                <td>208</td>
                <td>15</td>
                <td>2012</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Top 10 productive and influential authors ranked by H-index and total citations.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="290"/>
            <col width="90"/>
            <col width="90"/>
            <col width="150"/>
            <col width="140"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td>Author</td>
                <td>H-index</td>
                <td>M-index</td>
                <td>Total citations, n</td>
                <td>Publications, n</td>
                <td>Publication year</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Zhang Y</td>
                <td>17</td>
                <td>—<sup>a</sup></td>
                <td>776</td>
                <td>35</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Li X</td>
                <td>13</td>
                <td>—</td>
                <td>544</td>
                <td>35</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Wang J</td>
                <td>12</td>
                <td>1.33</td>
                <td>861</td>
                <td>24</td>
                <td>2014</td>
              </tr>
              <tr valign="top">
                <td>Wang L</td>
                <td>12</td>
                <td>—</td>
                <td>1072</td>
                <td>22</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>Wang Y</td>
                <td>10</td>
                <td>1.25</td>
                <td>342</td>
                <td>21</td>
                <td>2015</td>
              </tr>
              <tr valign="top">
                <td>Li Z</td>
                <td>10</td>
                <td>1.67</td>
                <td>366</td>
                <td>14</td>
                <td>2017</td>
              </tr>
              <tr valign="top">
                <td>Brownstein JS</td>
                <td>10</td>
                <td>0.77</td>
                <td>748</td>
                <td>11</td>
                <td>2010</td>
              </tr>
              <tr valign="top">
                <td>Wang Z</td>
                <td>9</td>
                <td>1.00</td>
                <td>427</td>
                <td>18</td>
                <td>2014</td>
              </tr>
              <tr valign="top">
                <td>Zhang W</td>
                <td>9</td>
                <td>1.13</td>
                <td>556</td>
                <td>12</td>
                <td>2015</td>
              </tr>
              <tr valign="top">
                <td>Zhang X</td>
                <td>9</td>
                <td>1.29</td>
                <td>371</td>
                <td>12</td>
                <td>2016</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Not available.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The aim and scope of the top 10 most influential journals, as listed in <xref ref-type="table" rid="table2">Table 2</xref>, is to publish medical research, medical informatics, or multidisciplinary studies. It can thus be inferred that major future breakthroughs regarding big data in infectious diseases epidemiology will likely appear in these journals.</p>
        <p><xref rid="figure3" ref-type="fig">Figure 3</xref> displays the top 20 most productive institutions. Institutional contributions were assessed by affiliations with at least one author in the publication. Except for the University of California, the top three institutions, which account for 21.3% of the number of publications in the top 20, were medical schools: Harvard Medical School (7.9%) and Icahn School of Medicine at Mount Sinai (6.4%). The other institutions, each accounting for more than 6% of the total, included Columbia University and Oxford University in the top 5, whereas others in the top 20 are research universities: London School of Hygiene and Tropical Medicine focuses on global and public health, Taipei Medical University is medical-based, and Huazhong University of Science and Technology is focused on science and technology. The United States produced the majority of the top 10 most productive institutions, which were in the top 5.</p>
        <p>The 20 most productive countries (<xref rid="figure4" ref-type="fig">Figure 4</xref>) are led by the United States and China, accounting for more than half (57.3%) of the total publication output. The United States alone accounted for 41.1% of the productivity in this field. The other countries in the top five were the United Kingdom (9.4%), India (4.4%), and Canada (3.3%).</p>
        <p>Computer science was the most productive research domain in the bibliographic collection (<xref rid="figure5" ref-type="fig">Figure 5</xref>), accounting for 17.6% of the top 10 subject areas. In order of productivity, the other research subjects in the top 5 were public environmental and occupational health (11.4%), health care services (9.6%), medical informatics (9.0%), and engineering (8.8%).</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Top 20 institutions by number of publications. CALIF: California; HARVARD MED SCH: Harvard Medical School; ICAHN SCH MED MT SINAI: Icahn School of Medicine at Mount Sinai; LONDON SCH HYG AND TROP MED: London School of Hygiene &#38; Tropical Medicine; PENN: Pennsylvania; UNIV: University.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Top 20 productive countries by number of publications.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Top 10 key subject areas by number of publications.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Two major clusters of countries represent the collaboration patterns of the most productive countries (<xref rid="figure6" ref-type="fig">Figure 6</xref>). The network was set to include only countries with at least 10 documents, resulting in 50 productive countries. The clustering results demonstrated a demarcation of European countries from the others. For instance, cluster 1 (red) represented most countries from Europe, with England, Germany, and Spain being the core countries. Non-European countries constituted the second cluster (green). The United States and China were the core countries of this group.</p>
        <p>Regarding collaboration strength, the United States, with a total link strength of 570, featured the highest number of partners (48), accounting for almost all 50 countries in the network (96%). China, which distantly followed the United States, featured 38 partners and a total link strength of 304. This implies that collaboration is mainly regional.</p>
        <p><xref rid="figure7" ref-type="fig">Figure 7</xref> shows a network map of cocited references in this research area, wherein the node’s size represents the citation strength of the individual studies. The network was set to include only studies with at least 25 citations, resulting in 37 studies. Ginsberg et al [<xref ref-type="bibr" rid="ref31">31</xref>] published the most highly cited article (185 citations). This 13-year-old study presented a method that used Google search queries to track flu-like illnesses in a population. The second most cited study by Eysenbach [<xref ref-type="bibr" rid="ref9">9</xref>] introduced the concept of infodemiology, the science of using the internet (eg, social media, search engines, blogs, and websites) to inform public health and public policy. <xref ref-type="table" rid="table4">Table 4</xref> further summarizes the top 15 most cited references, including the title, year of publication, number of citations, type of disease, and data source.</p>
        <p>The 37 studies in the network map of cocited references produced four thematic clusters (<xref rid="figure7" ref-type="fig">Figure 7</xref>); disease monitoring and surveillance (cluster 1), utility of electronic health (or medical) records (cluster 2), methodology framework for infodemiology tools (cluster 3), and machine learning and deep learning methods (cluster 4) were the main topics discussed.</p>
        <p>Keyword co-occurrence analysis serves as a supplement to enrich the understanding of the thematic clusters derived from the reference cocitation analysis and helps identify the core topics and contents [<xref ref-type="bibr" rid="ref29">29</xref>]. As shown in <xref rid="figure8" ref-type="fig">Figure 8</xref>, the co-occurrence network displayed 100 relevant keywords after assigning a selection threshold of 10 for the number of keyword occurrences. The top 5 most frequently used keywords were <italic>COVID-19, big data, machine learning, coronavirus,</italic> and <italic>electronic health records.</italic></p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Network of country collaborations (≥10 documents, 50 countries, 2 clusters).</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Network of cocited references.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Summary of the top 15 most cited references.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="360"/>
            <col width="120"/>
            <col width="120"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Reference</td>
                <td>Citations, n</td>
                <td>Disease</td>
                <td>Data source</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Ginsberg et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                <td>185</td>
                <td>Influenza</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>Eysenbach [<xref ref-type="bibr" rid="ref9">9</xref>]</td>
                <td>74</td>
                <td>Influenza</td>
                <td>NA<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>Nuti et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                <td>69</td>
                <td>NA</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>Lazer et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>67</td>
                <td>Influenza</td>
                <td>Google Flu</td>
              </tr>
              <tr valign="top">
                <td>Carneiro and Mylonaki [<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                <td>54</td>
                <td>NA</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>Zhou et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>49</td>
                <td>COVID-19</td>
                <td>Electronic health records</td>
              </tr>
              <tr valign="top">
                <td>Dong et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>49</td>
                <td>COVID-19</td>
                <td>Twitter feeds and DXY<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Polgreen et al [<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>48</td>
                <td>Influenza</td>
                <td>Yahoo searches</td>
              </tr>
              <tr valign="top">
                <td>Mavragani and Ochoa [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>43</td>
                <td>NA</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>Huang et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>42</td>
                <td>COVID-19</td>
                <td>Electronic medical records</td>
              </tr>
              <tr valign="top">
                <td>Eysenbach [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>41</td>
                <td>Influenza</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>Wu et al [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>34</td>
                <td>COVID-19</td>
                <td>Electronic medical records</td>
              </tr>
              <tr valign="top">
                <td>Li et al [<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                <td>33</td>
                <td>COVID-19</td>
                <td>Internet searches<sup>c</sup> and Weibo index<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td>Santillana et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                <td>31</td>
                <td>Influenza</td>
                <td>Twitter and Google Trends</td>
              </tr>
              <tr valign="top">
                <td>Signorini et al [<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                <td>30</td>
                <td>Influenza</td>
                <td>Twitter</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>NA: not applicable (eg, a review paper, no particular disease or data source for a case study).</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>Online platform of real-time COVID-19 cases in China.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>Internet searches include Google Trends and Baidu Index.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>Weibo is a China-based social media platform.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Co-occurrence networks of author keywords.</p>
          </caption>
          <graphic xlink:href="ijmr_v12i1e42292_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The 100 author-derived keywords produced four clusters from the coword analysis (<xref rid="figure8" ref-type="fig">Figure 8</xref>). Cluster 1 (yellow-green) is related to public health and infectious diseases, with top keywords such as <italic>COVID-19, SARS-CoV-2, epidemiology,</italic> and <italic>epidemics</italic>. Cluster 2 (green) is related to electronic storage and delivery of health care, with top keywords including <italic>electronic health records, clinical decision support, primary care, epidemiology,</italic> and <italic>telemedicine</italic>. Cluster 3 (blue) involves infodemiology tools, with top keywords including <italic>coronavirus, google trends, social media, infodemiology</italic>, and <italic>surveillance</italic>. Cluster 4 (red) is more coherent and broadly related to big data and artificial intelligence, including top keywords <italic>big data, machine learning, artificial intelligence, deep learning,</italic> and <italic>big data analytics.</italic></p>
      </sec>
      <sec>
        <title>Systematic Review of the Top 20 Papers</title>
        <p>Further filtering of the top 20 papers was performed to determine if they met the following criteria: (1) addressed at least one infectious disease and (2) utilized a big data source. A review of these 20 papers (summarized in <xref ref-type="table" rid="table5">Table 5</xref>) was then performed. These selected studies were mainly characterized by papers that utilized novel data sources, including internet search engine data (Google Trends: n=11; Baidu or Weibo index: n=2; Yahoo: n=1) and social media data (Twitter: n=5). Other data sources included electronic health or medical records (n=3) and Tencent migration data (n=1). The most frequently studied diseases were COVID-19 (n=10) [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref50">50</xref>], followed by influenza (n=8) [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref54">54</xref>]. Only one study considered the Zika virus [<xref ref-type="bibr" rid="ref55">55</xref>], and another considered the trio of meningitis, legionella pneumonia, and Ebola [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Summary of top 20 studies that addressed an infectious disease and utilized a big data source.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="50"/>
            <col width="90"/>
            <col width="580"/>
            <col width="160"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Rank</td>
                <td>Study</td>
                <td>Research objective and key findings</td>
                <td>Infectious disease(s)</td>
                <td>Big data source</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Polgreen et al [<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>Used internet search engine data for infectious diseases epidemiology and examined the relationship between Yahoo search queries for influenza and actual influenza occurrence. They estimated linear models, using searches with 1-10–week lead times as explanatory variables to predict the percentage of cultures positive for flu and deaths attributable to pneumonia and influenza in the United States. The fitted models predicted an increase in cultures positive for influenza 1-3 weeks in advance of when they occurred (<italic>P</italic>&#60;.001), and similar models predicted an increase in mortality attributable to pneumonia and influenza up to 5 weeks in advance (<italic>P</italic>&#60;.001).<break/>  <break/>  </td>
                <td>Influenza</td>
                <td>Internet search engine</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Walker et al [<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                <td>The research explored internet activity related to loss of smell in the United States and seven European countries. Spearman rank correlation was used to assess the relationship between loss-of-smell relative search volumes (RSVs), with the daily confirmed cases of COVID-19 and deaths. Strong and significant correlations (<italic>P</italic>&#60;.05) between daily RSVs related to loss of smell, daily COVID-19 cases, and deaths were found, ranging from 0.633 to 0.952.</td>
                <td>COVID-19</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Effenberger et al [<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                <td>Studied correlations between RSVs and the official COVID-19 cases reported by the European Centre for Disease Control (ECDC) for some selected countries. They opted for time-lag correlation analysis and observed a time lag of –11.5 days being the highest correlation across all investigated countries.</td>
                <td>COVID-19</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Ayyoubzadeh et al [<xref ref-type="bibr" rid="ref47">47</xref>]</td>
                <td>Opted for machine/deep learning with Google Trends data. Linear regression and long short-term memory (LSTM) models were used to estimate COVID-19 cases. They found that the linear regression model had the smaller root mean square error (RMSE) and was the better predictive model. They also found the most predictive factors of the model to be search terms of handwashing, hand sanitizer, and antiseptic topics.</td>
                <td>COVID-19</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Husnayain et al [<xref ref-type="bibr" rid="ref48">48</xref>]</td>
                <td>Considered smaller spatial coverages in their Google Trends analysis. They retrieved data from specific locations and subregions in Taiwan nationwide using defined search terms related to the coronavirus, handwashing, and face masks. Their findings suggest high to moderate correlations between RSVs and COVID-19 cases in Taipei (lag –3), New Taipei (lag –2), Taoyuan (lag –2), Tainan (lag –1), Taichung (lag 0), and Kaohsiung (lag 0).</td>
                <td>COVID-19</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Eysenbach [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>Found a strong correlation (Pearson <italic>r</italic>=0.91) between the number of clicks on a keyword-triggered link in Google with epidemiological data from Canada’s flu season of 2004-2005.</td>
                <td>Influenza</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Yang et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>To improve the existing Google Flu Trends (GFT), they proposed an influenza tracking model, ARGO (AutoRegression with Google search data), that uses publicly available online search data. Besides having a rigorous statistical foundation, ARGO outperforms the latest GFT version. Not only does ARGO incorporate seasonality in influenza epidemics but it also captures changes in online search behavior over time.</td>
                <td>Influenza</td>
                <td>ARGO</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Cook et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>Evaluated the accuracy of each US GFT model by comparing weekly estimates of influenza-like illness (ILI) activity with the US Outpatient Influenza-like Illness Surveillance Network (ILINet). They calculated the correlation and RMSE between model estimates and ILINet for four seasons: pre-H1N1, Summer H1N1, Winter H1N1, and H1N1 overall. Both models’ estimates were highly correlated with ILINet pre-H1N1 and over the entire surveillance period, although the original model underestimated the magnitude of ILI activity during the pre-H1N1 phase. The updated model was more correlated with ILINet than the original model during Summer H1N1 (<italic>r </italic>= 0.95 and 0.29, respectively).</td>
                <td>Influenza</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Yuan et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>Used Baidu, a popular Chinese search index, to model and monitor influenza activity in China. A comprehensive technique was presented for (1) keyword selection, (2) keyword filtering, (3) index composition, and (4) modeling and detection of influenza activity in China. Sequential time series for the selected composite keyword index was significantly correlated with official Chinese influenza cases. Further, 1-month-ahead prediction of flu cases had a considerably small prediction error (mean absolute percent error&#60;11%).</td>
                <td>Influenza</td>
                <td>Baidu search index</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Dong et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Used DXY, an online platform of the Chinese medical community, as a primary data source to develop an online interactive dashboard. The dashboard is hosted by the Center for Systems Science and Engineering (CSSE) at Johns Hopkins University, United States. They monitored various Twitter feeds, online news services, and direct communication sent through the dashboard to identify new cases.</td>
                <td>COVID-19</td>
                <td>DXY, Twitter feeds, online news services</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Signorini et al [<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                <td>To explore public concerns regarding rapidly evolving H1N1 activity, used Twitter data and support vector regression to show that estimates of ILI accurately tracked reported disease levels. They retrieved a large sample of public tweets that matched a set of flu-related search terms.</td>
                <td>Influenza</td>
                <td>Twitter</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>Chew and Eyesenbach [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>Proposed and evaluated a complementary infoveillance approach using Twitter during the 2009 H1N1 pandemic. They performed a content analysis of tweets and validated Twitter as a real-time content and sentiment tracking tool. Infovigil, an infoveillance technology, was used to record more than 2 million Twitter postings with the terms “swine flu” and “H1N1.” According to content analysis, resource-related posts were most commonly shared (52.6%). Misinformation occurred in 4.5% of the cases. News websites were the most popular sources (23.2%), while government and health agencies were linked only 1.5% of the time.</td>
                <td>Influenza</td>
                <td>Twitter</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>Zhou et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>Used logistic regression models to explore the risk factors associated with in-hospital deaths. They utilized a retrospective, multicenter cohort study that included all adult inpatients with laboratory-confirmed COVID-19.</td>
                <td>COVID-19</td>
                <td>Electronic health (medical) records</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>Huang et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>This descriptive study detailed descriptive statistics of clinical features of patients infected with COVD-19 in China as extracted from electronic medical records.</td>
                <td>COVID-19</td>
                <td>Electronic health (medical) records</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>Williamson et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>Developed OpenSAFELY, a secure health analytics platform that maintains patient data in the current data center of a significant provider of primary care electronic health records and serves 40% of all patients in England. OpenSAFELY was used to examine factors associated with COVID-19–related deaths; 10,926 COVID-19–related deaths were pseudonymously linked to primary care records of 17,278,392 persons.</td>
                <td>COVID-19</td>
                <td>Electronic health (medical) records</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>Wu et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>Used data on monthly airline bookings from the Official Aviation Guide and data on human mobility across more than 300 prefecture-level Chinese cities from the Tencent database. The reports released by the Chinese Center for Disease Control and Prevention provided information on confirmed cases. A susceptible-exposed-infectious-recovered (SEIR) model was used to simulate the epidemics in China’s main cities. They concluded that, with a lag time of roughly 1-2 weeks behind the Wuhan outbreak, epidemics were already expanding exponentially in several large cities throughout China, assuming the transmissibility of SARS-CoV-2 was identical domestically and over time.</td>
                <td>COVID-19</td>
                <td>Tencent Migration data</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>Santillana et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                <td>Presented an ensemble-based machine learning method that leverages data from various sources, including Google searches, Twitter microblogs, and near real-time hospital visit records, to provide nowcast and forecast estimates of influenza activity in the United States. Their method combines multiple ILI activity estimates, generated independently with each data source, into a single prediction of ILI. Evaluation of the predictive ability of their method suggests that it outperforms every prediction using each data source independently. Additionally, it generated estimates 2 and 3 weeks ahead of time with comparable accuracy to real-time forecasts from an autoregressive model and predictions 1 week ahead of GFT’s real-time estimates.</td>
                <td>Influenza</td>
                <td>Google searches, Twitter microblogs, and near real-time hospital visit records</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>Li et al [<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                <td>Evaluated the predictive value of search data from Google Trends and two Chinese social media platforms, Weibo index and Baidu index, for the COVID-19 epidemic in China. They observed that the peak of internet searches and social media data about the COVID-19 outbreak occurred 10-14 days earlier than the peak of daily incidences in China. Internet searches and social media data were highly correlated (<italic>r</italic>&#62;0.89) with daily incidences.</td>
                <td>COVID-19</td>
                <td>Google Trends, Weibo index, Baidu index</td>
              </tr>
              <tr valign="top">
                <td>19</td>
                <td>Cervellin et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>Compared the reliability of Google Trends in different clinical settings for common diseases with lower media coverage and for less common diseases attracting major media coverage. They carried out a Google Trends search using the keywords “renal colic,” “epistaxis,” and “mushroom poisoning.” Additionally, a second search was carried out for three clinical conditions (ie, “meningitis,” “<italic>Legionella pneumophila</italic> pneumonia,” and “Ebola fever”). No correlation was observed between Google Trends and epidemiology of renal colics, epistaxis, and mushroom poisoning. When searching the term “mushroom” alone, the Google Trends search generated a seasonal pattern, almost overlapping with the epidemiological profile.</td>
                <td>Meningitis, <italic>Legionella</italic> pneumonia, and Ebola</td>
                <td>Google Trends</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>Teng et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>Developed a dynamic forecasting model for Zika virus (ZIKV) based on Google Trends. A strong correlation was found between Zika-related Google Trends and the cumulative numbers of reported cases (confirmed, suspected, and total cases <italic>P</italic>&#60;.001). Further, an autoregressive integrated moving average (ARIMA) model (0,1,3) was fitted for the dynamic estimation of ZIKV outbreaks. The forecasting results indicated that the ARIMA model, which used the online search data as the external regressor to enhance the forecasting model, is quite similar to the actual data during the Zika virus epidemic.</td>
                <td>Zika</td>
                <td>Google Trends</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Novel big data streams have created interesting opportunities for infectious disease monitoring and control. The review of the top 20 papers suggests the domination of high-volume electronic health records and digital traces such as internet searches and social media. Of note is the relatively increased use of Google Trends. Most studies used Google Trends data by correlating them with official data on disease occurrence, spread, and outbreaks. Some of these studies further adopted nowcasting for disease surveillance. However, using Google Trends for forecasts and predictions in infectious diseases epidemiology fills a gap in the extant literature. Few studies have gone as far as predicting incidents and occurrences, even though data on reported cases of various health concerns and the associated Google Trends data have been correlated in many studies. Predicting the future is hard; hence, more reliable and efficient methodologies are needed for forecasting infectious disease outbreaks.</p>
        <p>There are a few drawbacks to digital trace data that should be considered. Many of these data streams miss demographic information such as age and gender, which is essential in almost any epidemiological study. Besides, they represent a growing but still limited population segment, with infants unfeatured and fewer older adults than younger people. Geographic heterogeneity in coverage exists, with underrepresentation in developing countries, although these biases tend to fade and are arguably less pronounced than those found in traditional global surveillance systems. Further, the retrieved data are subject to spatial and temporal uncertainty. Accordingly, hybrid systems that supplement rather than replace conventional surveillance systems as well as improve prospects for accurate infectious disease models and forecasts should be developed.</p>
        <p>Most studies, except for those in the United States and China, were conducted in the European context. Thus, more studies need to test the utility of these big data streams for infectious disease epidemiology in the context of more countries, especially in Africa. Future research questions should ask if any cross-cultural differences between countries affect the adoption and use of big data in infectious disease epidemiology.</p>
        <p>The vast majority of infectious diseases have a global distribution. Apart from the coronavirus, influenza, Zika, and Ebola virus outbreaks that are featured in our review, the utility of these big data sources for more infectious diseases should be studied.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>A few limitations were inherent in our study. First, like any bibliometric study, we are limited by the search terms and database used. This study utilized English publications from the WoS core collection; therefore, relevant publications may have been missed. However, our choice of WoS was informed by its greater coverage of high-impact journals. Second, some studies may have been published after we concluded document extraction. Accordingly, this study does not claim to be exhaustive but rather extensive.</p>
      </sec>
      <sec>
        <title>Future Research Agenda and Conclusions</title>
        <p>The bibliometric study identified the United States and China as research leaders in this field, with most affiliations from the Harvard Medical School and the University of California. Top authors were Zhang Yi and Li Xingwang. <italic>Journal of Medical Internet Research</italic> and <italic>PLoS One</italic> are the most productive and influential journals in this field. Internet searches and social media data are the most utilized data sources. COVID-19 and influenza were the most studied infectious diseases. The main research themes in this area of research were disease monitoring and surveillance, utility of electronic health (or medical) records, methodology framework for infodemiology tools, and machine/deep learning. Most research papers on big data in infectious diseases epidemiology were published in outlets related to computer science, public health, and health care services.</p>
        <p>Opportunities for future research are revealed directly from the results of this study. Integrating multiple surveillance platforms, including big data tools, are critical to better understanding pathogen spread. It is also paramount for the research needs to align with a global view of disease risk. The risk of infectious disease is globally shared in an increasingly connected world. The COVID-19 pandemic, including the rapid global circulation of evolved strains, has emphasized the need for an interdisciplinary, collaborative, global framework for infectious disease research and control. There is a need to empower epidemiologists and public health scientists to leverage insights from big data for infectious disease prevention and control.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">WoS</term>
          <def>
            <p>Web of Science</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmud</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Rajeev</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rasambainarivo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rice</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tatem</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wesolowski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Metcalf</surname>
              <given-names>CJE</given-names>
            </name>
          </person-group>
          <article-title>Infectious disease in an era of global change</article-title>
          <source>Nat Rev Microbiol</source>
          <year>2022</year>
          <month>04</month>
          <day>13</day>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>193</fpage>
          <lpage>205</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34646006"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41579-021-00639-z</pub-id>
          <pub-id pub-id-type="medline">34646006</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41579-021-00639-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC8513385</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hotez</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Globalists versus nationalists: Bridging the divide through blue marble health</article-title>
          <source>PLoS Negl Trop Dis</source>
          <year>2019</year>
          <month>07</month>
          <day>11</day>
          <volume>13</volume>
          <issue>7</issue>
          <fpage>e0007156</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pntd.0007156"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pntd.0007156</pub-id>
          <pub-id pub-id-type="medline">31295247</pub-id>
          <pub-id pub-id-type="pii">PNTD-D-19-00011</pub-id>
          <pub-id pub-id-type="pmcid">PMC6622467</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Metcalf</surname>
              <given-names>CJE</given-names>
            </name>
            <name name-style="western">
              <surname>Tatem</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bjornstad</surname>
              <given-names>ON</given-names>
            </name>
            <name name-style="western">
              <surname>Lessler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>O'Reilly</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cutts</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Grenfell</surname>
              <given-names>BT</given-names>
            </name>
          </person-group>
          <article-title>Transport networks and inequities in vaccination: remoteness shapes measles vaccine coverage and prospects for elimination across Africa</article-title>
          <source>Epidemiol Infect</source>
          <year>2015</year>
          <month>05</month>
          <volume>143</volume>
          <issue>7</issue>
          <fpage>1457</fpage>
          <lpage>1466</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25119237"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/S0950268814001988</pub-id>
          <pub-id pub-id-type="medline">25119237</pub-id>
          <pub-id pub-id-type="pii">S0950268814001988</pub-id>
          <pub-id pub-id-type="pmcid">PMC4411642</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kasson</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>Infectious disease research in the era of big data</article-title>
          <source>Annu Rev Biomed Data Sci</source>
          <year>2020</year>
          <month>07</month>
          <day>20</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>43</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-biodatasci-121219-025722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <article-title>Big data</article-title>
          <source>Wikipedia</source>
          <access-date>2022-05-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://en.wikipedia.org/w/index.php?title=Big_data&#38;oldid=1089502025">https://en.wikipedia.org/w/index.php?title=Big_data&#38;oldid=1089502025</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hay</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Moyes</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Big data opportunities for global infectious disease surveillance</article-title>
          <source>PLoS Med</source>
          <year>2013</year>
          <month>4</month>
          <day>2</day>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>e1001413</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pmed.1001413"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1001413</pub-id>
          <pub-id pub-id-type="medline">23565065</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-12-02464</pub-id>
          <pub-id pub-id-type="pmcid">PMC3614504</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Milinovich</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Soares Magalhães</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Role of big data in the early detection of Ebola and other emerging infectious diseases</article-title>
          <source>Lancet Glob Health</source>
          <year>2015</year>
          <month>01</month>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>e20</fpage>
          <lpage>e21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-109X(14)70356-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2214-109X(14)70356-0</pub-id>
          <pub-id pub-id-type="medline">25539964</pub-id>
          <pub-id pub-id-type="pii">S2214-109X(14)70356-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence for infectious disease big data analytics</article-title>
          <source>Infect Dis Health</source>
          <year>2019</year>
          <month>02</month>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1016/j.idh.2018.10.002</pub-id>
          <pub-id pub-id-type="medline">30541697</pub-id>
          <pub-id pub-id-type="pii">S2468-0451(18)30144-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the Internet</article-title>
          <source>J Med Internet Res</source>
          <year>2009</year>
          <month>03</month>
          <day>27</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>e11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2009/1/e11/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
          <pub-id pub-id-type="medline">19329408</pub-id>
          <pub-id pub-id-type="pii">v11i1e11</pub-id>
          <pub-id pub-id-type="pmcid">PMC2762766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salathé</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Digital epidemiology: what is it, and where is it going?</article-title>
          <source>Life Sci Soc Policy</source>
          <year>2018</year>
          <month>01</month>
          <day>04</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29302758"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40504-017-0065-7</pub-id>
          <pub-id pub-id-type="medline">29302758</pub-id>
          <pub-id pub-id-type="pii">10.1186/s40504-017-0065-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5754279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thacker</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Stroup</surname>
              <given-names>DF</given-names>
            </name>
          </person-group>
          <article-title>Future directions for comprehensive public health surveillance and health information systems in the United States</article-title>
          <source>Am J Epidemiol</source>
          <year>1994</year>
          <month>09</month>
          <day>01</day>
          <volume>140</volume>
          <issue>5</issue>
          <fpage>383</fpage>
          <lpage>397</lpage>
          <pub-id pub-id-type="doi">10.1093/oxfordjournals.aje.a117261</pub-id>
          <pub-id pub-id-type="medline">8067331</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woolhouse</surname>
              <given-names>MEJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rambaut</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kellam</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Lessons from Ebola: Improving infectious disease surveillance to inform outbreak management</article-title>
          <source>Sci Transl Med</source>
          <year>2015</year>
          <month>09</month>
          <day>30</day>
          <volume>7</volume>
          <issue>307</issue>
          <fpage>307rv5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26424572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/scitranslmed.aab0191</pub-id>
          <pub-id pub-id-type="medline">26424572</pub-id>
          <pub-id pub-id-type="pii">7/307/307rv5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5819730</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farhadloo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Winneg</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Hall Jamieson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Albarracin</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Associations of topics of discussion on Twitter with survey measures of attitudes, knowledge, and behaviors related to Zika: probabilistic study in the United States</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2018</year>
          <month>02</month>
          <day>09</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>e16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2018/1/e16/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.8186</pub-id>
          <pub-id pub-id-type="medline">29426815</pub-id>
          <pub-id pub-id-type="pii">v4i1e16</pub-id>
          <pub-id pub-id-type="pmcid">PMC5889815</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Baltrusaitis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leskovec</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sosic</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Conidi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gunn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zink</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Santillana</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Accurate influenza monitoring and forecasting using novel internet data streams: a case study in the Boston metropolis</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2018</year>
          <month>01</month>
          <day>09</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>e4</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2018/1/e4/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.8950</pub-id>
          <pub-id pub-id-type="medline">29317382</pub-id>
          <pub-id pub-id-type="pii">v4i1e4</pub-id>
          <pub-id pub-id-type="pmcid">PMC5780615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mavragani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sampri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sypsa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tsagarakis</surname>
              <given-names>KP</given-names>
            </name>
          </person-group>
          <article-title>Integrating smart health in the US health care system: infodemiology study of asthma monitoring in the Google era</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2018</year>
          <month>03</month>
          <day>12</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>e24</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2018/1/e24/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.8726</pub-id>
          <pub-id pub-id-type="medline">29530839</pub-id>
          <pub-id pub-id-type="pii">v4i1e24</pub-id>
          <pub-id pub-id-type="pmcid">PMC5869181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Lent</surname>
              <given-names>LG</given-names>
            </name>
            <name name-style="western">
              <surname>Sungur</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kunneman</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>van de Velde</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Too far to care? Measuring public attention and fear for Ebola using Twitter</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>06</month>
          <day>13</day>
          <volume>19</volume>
          <issue>6</issue>
          <fpage>e193</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/6/e193/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7219</pub-id>
          <pub-id pub-id-type="medline">28611015</pub-id>
          <pub-id pub-id-type="pii">v19i6e193</pub-id>
          <pub-id pub-id-type="pmcid">PMC5487741</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wongkoblap</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vadillo</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Researching mental health disorders in the era of social media: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>06</month>
          <day>29</day>
          <volume>19</volume>
          <issue>6</issue>
          <fpage>e228</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/6/e228/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7215</pub-id>
          <pub-id pub-id-type="medline">28663166</pub-id>
          <pub-id pub-id-type="pii">v19i6e228</pub-id>
          <pub-id pub-id-type="pmcid">PMC5509952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Detecting lung cancer trends by leveraging real-world and internet-based data: infodemiology study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>03</month>
          <day>12</day>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>e16184</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/3/e16184/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16184</pub-id>
          <pub-id pub-id-type="medline">32163035</pub-id>
          <pub-id pub-id-type="pii">v22i3e16184</pub-id>
          <pub-id pub-id-type="pmcid">PMC7099398</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mavragani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gkillas</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 predictability in the United States using Google Trends time series</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>11</month>
          <day>26</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>20693</fpage>
          <pub-id pub-id-type="doi">10.1038/s41598-020-77275-9</pub-id>
          <pub-id pub-id-type="medline">33244028</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-77275-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7692493</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Qiao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Olatosi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Emergence and evolution of big data science in HIV research: Bibliometric analysis of federally sponsored studies 2000-2019</article-title>
          <source>Int J Med Inform</source>
          <year>2021</year>
          <month>10</month>
          <volume>154</volume>
          <fpage>104558</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34481301"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2021.104558</pub-id>
          <pub-id pub-id-type="medline">34481301</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(21)00184-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8529625</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Loebbecke</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Engaging scientometrics in information systems</article-title>
          <source>J Inf Technol</source>
          <year>2017</year>
          <month>03</month>
          <day>01</day>
          <volume>32</volume>
          <issue>1</issue>
          <fpage>85</fpage>
          <lpage>109</lpage>
          <pub-id pub-id-type="doi">10.1057/jit.2015.29</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Visualizing a field of research: a methodology of systematic scientometric reviews</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>10</month>
          <day>31</day>
          <volume>14</volume>
          <issue>10</issue>
          <fpage>e0223994</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0223994"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0223994</pub-id>
          <pub-id pub-id-type="medline">31671124</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-16569</pub-id>
          <pub-id pub-id-type="pmcid">PMC6822756</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aria</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cuccurullo</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>bibliometrix : An R-tool for comprehensive science mapping analysis</article-title>
          <source>J Informetr</source>
          <year>2017</year>
          <month>11</month>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>959</fpage>
          <lpage>975</lpage>
          <pub-id pub-id-type="doi">10.1016/j.joi.2017.08.007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Porter</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Discovering and forecasting interactions in big data research: a learning-enhanced bibliometric study</article-title>
          <source>Technol Forecast Soc Change</source>
          <year>2019</year>
          <month>09</month>
          <volume>146</volume>
          <fpage>795</fpage>
          <lpage>807</lpage>
          <pub-id pub-id-type="doi">10.1016/j.techfore.2018.06.007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harzing</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alakangas</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Google Scholar, Scopus and the Web of Science: a longitudinal and cross-disciplinary comparison</article-title>
          <source>Scientometrics</source>
          <year>2015</year>
          <month>11</month>
          <day>26</day>
          <volume>106</volume>
          <issue>2</issue>
          <fpage>787</fpage>
          <lpage>804</lpage>
          <pub-id pub-id-type="doi">10.1007/s11192-015-1798-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirsch</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>An index to quantify an individual’s scientific research output that takes into account the effect of multiple coauthorship</article-title>
          <source>Scientometrics</source>
          <year>2010</year>
          <month>3</month>
          <day>13</day>
          <volume>85</volume>
          <issue>3</issue>
          <fpage>741</fpage>
          <lpage>754</lpage>
          <pub-id pub-id-type="doi">10.1007/s11192-010-0193-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Batagelj</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Cerinšek</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>On bibliographic networks</article-title>
          <source>Scientometrics</source>
          <year>2013</year>
          <month>1</month>
          <day>20</day>
          <volume>96</volume>
          <issue>3</issue>
          <fpage>845</fpage>
          <lpage>864</lpage>
          <pub-id pub-id-type="doi">10.1007/s11192-012-0940-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>VD</given-names>
            </name>
            <name name-style="western">
              <surname>Guillaume</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Lambiotte</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lefebvre</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Fast unfolding of communities in large networks</article-title>
          <source>J Stat Mech Theory Exp</source>
          <year>2008</year>
          <volume>10</volume>
          <fpage>P10008</fpage>
          <pub-id pub-id-type="doi">10.1088/1742-5468/2008/10/P10008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Su</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Mapping knowledge structure by keyword co-occurrence: a first look at journal papers in Technology Foresight</article-title>
          <source>Scientometrics</source>
          <year>2010</year>
          <month>6</month>
          <day>22</day>
          <volume>85</volume>
          <issue>1</issue>
          <fpage>65</fpage>
          <lpage>79</lpage>
          <pub-id pub-id-type="doi">10.1007/s11192-010-0259-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Eck</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Waltman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Software survey: VOSviewer, a computer program for bibliometric mapping</article-title>
          <source>Scientometrics</source>
          <year>2010</year>
          <month>08</month>
          <day>31</day>
          <volume>84</volume>
          <issue>2</issue>
          <fpage>523</fpage>
          <lpage>538</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20585380"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11192-009-0146-3</pub-id>
          <pub-id pub-id-type="medline">20585380</pub-id>
          <pub-id pub-id-type="pmcid">PMC2883932</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ginsberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mohebbi</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Brammer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Smolinski</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Brilliant</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Detecting influenza epidemics using search engine query data</article-title>
          <source>Nature</source>
          <year>2009</year>
          <month>02</month>
          <day>19</day>
          <volume>457</volume>
          <issue>7232</issue>
          <fpage>1012</fpage>
          <lpage>1014</lpage>
          <pub-id pub-id-type="doi">10.1038/nature07634</pub-id>
          <pub-id pub-id-type="medline">19020500</pub-id>
          <pub-id pub-id-type="pii">nature07634</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nuti</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Wayda</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ranasinghe</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>Murugiah</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The use of google trends in health care research: a systematic review</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <month>10</month>
          <day>22</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>e109583</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0109583"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0109583</pub-id>
          <pub-id pub-id-type="medline">25337815</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-22976</pub-id>
          <pub-id pub-id-type="pmcid">PMC4215636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lazer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kennedy</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Vespignani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Big data. The parable of Google Flu: traps in big data analysis</article-title>
          <source>Science</source>
          <year>2014</year>
          <month>03</month>
          <day>14</day>
          <volume>343</volume>
          <issue>6176</issue>
          <fpage>1203</fpage>
          <lpage>1205</lpage>
          <pub-id pub-id-type="doi">10.1126/science.1248506</pub-id>
          <pub-id pub-id-type="medline">24626916</pub-id>
          <pub-id pub-id-type="pii">343/6176/1203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carneiro</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mylonakis</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Google trends: a web-based tool for real-time surveillance of disease outbreaks</article-title>
          <source>Clin Infect Dis</source>
          <year>2009</year>
          <month>11</month>
          <day>15</day>
          <volume>49</volume>
          <issue>10</issue>
          <fpage>1557</fpage>
          <lpage>1564</lpage>
          <pub-id pub-id-type="doi">10.1086/630200</pub-id>
          <pub-id pub-id-type="medline">19845471</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Clinical course and risk factors for mortality of adult inpatients with COVID-19 in Wuhan, China: a retrospective cohort study</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>03</month>
          <day>28</day>
          <volume>395</volume>
          <issue>10229</issue>
          <fpage>1054</fpage>
          <lpage>1062</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32171076"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)30566-3</pub-id>
          <pub-id pub-id-type="medline">32171076</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)30566-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7270627</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>An interactive web-based dashboard to track COVID-19 in real time</article-title>
          <source>Lancet Infect Dis</source>
          <year>2020</year>
          <month>05</month>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>533</fpage>
          <lpage>534</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32087114"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="medline">32087114</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Polgreen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pennock</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Using internet searches for influenza surveillance</article-title>
          <source>Clin Infect Dis</source>
          <year>2008</year>
          <month>12</month>
          <day>01</day>
          <volume>47</volume>
          <issue>11</issue>
          <fpage>1443</fpage>
          <lpage>1448</lpage>
          <pub-id pub-id-type="doi">10.1086/593098</pub-id>
          <pub-id pub-id-type="medline">18954267</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mavragani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ochoa</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Google trends in infodemiology and infoveillance: methodology framework</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2019</year>
          <month>05</month>
          <day>29</day>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>e13439</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2019/2/e13439/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13439</pub-id>
          <pub-id pub-id-type="medline">31144671</pub-id>
          <pub-id pub-id-type="pii">v5i2e13439</pub-id>
          <pub-id pub-id-type="pmcid">PMC6660120</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Clinical features of patients infected with 2019 novel coronavirus in Wuhan, China</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>395</volume>
          <issue>10223</issue>
          <fpage>497</fpage>
          <lpage>506</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0140-6736(20)30183-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)30183-5</pub-id>
          <pub-id pub-id-type="medline">31986264</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)30183-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159299</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology: tracking flu-related searches on the web for syndromic surveillance</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2006</year>
          <volume>2006</volume>
          <fpage>244</fpage>
          <lpage>248</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17238340"/>
          </comment>
          <pub-id pub-id-type="medline">17238340</pub-id>
          <pub-id pub-id-type="pii">86095</pub-id>
          <pub-id pub-id-type="pmcid">PMC1839505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>McGoogan</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Characteristics of and important lessons from the coronavirus disease 2019 (COVID-19) outbreak in China: summary of a report of 72 314 cases from the Chinese Center for Disease Control and Prevention</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>04</month>
          <day>07</day>
          <volume>323</volume>
          <issue>13</issue>
          <fpage>1239</fpage>
          <lpage>1242</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2020.2648</pub-id>
          <pub-id pub-id-type="medline">32091533</pub-id>
          <pub-id pub-id-type="pii">2762130</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Retrospective analysis of the possibility of predicting the COVID-19 outbreak from Internet searches and social media data, China, 2020</article-title>
          <source>Euro Surveill</source>
          <year>2020</year>
          <month>03</month>
          <volume>25</volume>
          <issue>10</issue>
          <fpage>2000199</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.eurosurveillance.org/content/10.2807/1560-7917.ES.2020.25.10.2000199"/>
          </comment>
          <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2020.25.10.2000199</pub-id>
          <pub-id pub-id-type="medline">32183935</pub-id>
          <pub-id pub-id-type="pmcid">PMC7078825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Santillana</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Combining search, social media, and traditional data sources to improve influenza surveillance</article-title>
          <source>PLoS Comput Biol</source>
          <year>2015</year>
          <month>10</month>
          <day>29</day>
          <volume>11</volume>
          <issue>10</issue>
          <fpage>e1004513</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pcbi.1004513"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1004513</pub-id>
          <pub-id pub-id-type="medline">26513245</pub-id>
          <pub-id pub-id-type="pii">PCOMPBIOL-D-15-00856</pub-id>
          <pub-id pub-id-type="pmcid">PMC4626021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Signorini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Segre</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Polgreen</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>The use of Twitter to track levels of disease activity and public concern in the U.S. during the influenza A H1N1 pandemic</article-title>
          <source>PLoS One</source>
          <year>2011</year>
          <month>05</month>
          <day>04</day>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>e19467</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0019467"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0019467</pub-id>
          <pub-id pub-id-type="medline">21573238</pub-id>
          <pub-id pub-id-type="pii">PONE-D-10-02464</pub-id>
          <pub-id pub-id-type="pmcid">PMC3087759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Surda</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Use of Google Trends to investigate loss-of-smell-related searches during the COVID-19 outbreak</article-title>
          <source>Int Forum Allergy Rhinol</source>
          <year>2020</year>
          <month>07</month>
          <day>15</day>
          <volume>10</volume>
          <issue>7</issue>
          <fpage>839</fpage>
          <lpage>847</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32279437"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/alr.22580</pub-id>
          <pub-id pub-id-type="medline">32279437</pub-id>
          <pub-id pub-id-type="pmcid">PMC7262261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Effenberger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kronbichler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tilg</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Perco</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Association of the COVID-19 pandemic with Internet Search Volumes: A Google Trends Analysis</article-title>
          <source>Int J Infect Dis</source>
          <year>2020</year>
          <month>06</month>
          <volume>95</volume>
          <fpage>192</fpage>
          <lpage>197</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1201-9712(20)30249-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijid.2020.04.033</pub-id>
          <pub-id pub-id-type="medline">32305520</pub-id>
          <pub-id pub-id-type="pii">S1201-9712(20)30249-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7162745</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayyoubzadeh</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Ayyoubzadeh</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Zahedi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmadi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>R Niakan Kalhori</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Predicting COVID-19 incidence through analysis of Google Trends data in Iran: data mining and deep learning pilot study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>04</month>
          <day>14</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>e18828</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/2/e18828/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18828</pub-id>
          <pub-id pub-id-type="medline">32234709</pub-id>
          <pub-id pub-id-type="pii">v6i2e18828</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159058</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Husnayain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fuad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>EC</given-names>
            </name>
          </person-group>
          <article-title>Applications of Google Search Trends for risk communication in infectious disease management: a case study of the COVID-19 outbreak in Taiwan</article-title>
          <source>Int J Infect Dis</source>
          <year>2020</year>
          <month>06</month>
          <volume>95</volume>
          <fpage>221</fpage>
          <lpage>223</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1201-9712(20)30140-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijid.2020.03.021</pub-id>
          <pub-id pub-id-type="medline">32173572</pub-id>
          <pub-id pub-id-type="pii">S1201-9712(20)30140-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7270523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Williamson</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bhaskaran</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bacon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Morton</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrkar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Inglesby</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cockburn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>HI</given-names>
            </name>
            <name name-style="western">
              <surname>MacKenna</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tomlinson</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Douglas</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rentsch</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Mathur</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>AYS</given-names>
            </name>
            <name name-style="western">
              <surname>Grieve</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Forbes</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Schultze</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Croker</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Parry</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hester</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Harper</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Perera</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>SJW</given-names>
            </name>
            <name name-style="western">
              <surname>Smeeth</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Goldacre</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with COVID-19-related death using OpenSAFELY</article-title>
          <source>Nature</source>
          <year>2020</year>
          <month>08</month>
          <day>08</day>
          <volume>584</volume>
          <issue>7821</issue>
          <fpage>430</fpage>
          <lpage>436</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32640463"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-020-2521-4</pub-id>
          <pub-id pub-id-type="medline">32640463</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-020-2521-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC7611074</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Leung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Leung</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Nowcasting and forecasting the potential domestic and international spread of the 2019-nCoV outbreak originating in Wuhan, China: a modelling study</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>02</month>
          <day>29</day>
          <volume>395</volume>
          <issue>10225</issue>
          <fpage>689</fpage>
          <lpage>697</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32014114"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)30260-9</pub-id>
          <pub-id pub-id-type="medline">32014114</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)30260-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Santillana</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kou</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Accurate estimation of influenza epidemics using Google search data via ARGO</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2015</year>
          <month>11</month>
          <day>24</day>
          <volume>112</volume>
          <issue>47</issue>
          <fpage>14473</fpage>
          <lpage>14478</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26553980"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1515373112</pub-id>
          <pub-id pub-id-type="medline">26553980</pub-id>
          <pub-id pub-id-type="pii">1515373112</pub-id>
          <pub-id pub-id-type="pmcid">PMC4664296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Conrad</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fowlkes</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Mohebbi</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Assessing Google flu trends performance in the United States during the 2009 influenza virus A (H1N1) pandemic</article-title>
          <source>PLoS One</source>
          <year>2011</year>
          <month>8</month>
          <day>19</day>
          <volume>6</volume>
          <issue>8</issue>
          <fpage>e23610</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0023610"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0023610</pub-id>
          <pub-id pub-id-type="medline">21886802</pub-id>
          <pub-id pub-id-type="pii">PONE-D-11-06712</pub-id>
          <pub-id pub-id-type="pmcid">PMC3158788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chunara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Monitoring influenza epidemics in china with search query from baidu</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <month>5</month>
          <day>30</day>
          <volume>8</volume>
          <issue>5</issue>
          <fpage>e64323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0064323"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0064323</pub-id>
          <pub-id pub-id-type="medline">23750192</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-00331</pub-id>
          <pub-id pub-id-type="pmcid">PMC3667820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chew</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Pandemics in the age of Twitter: content analysis of Tweets during the 2009 H1N1 outbreak</article-title>
          <source>PLoS One</source>
          <year>2010</year>
          <month>11</month>
          <day>29</day>
          <volume>5</volume>
          <issue>11</issue>
          <fpage>e14118</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0014118"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0014118</pub-id>
          <pub-id pub-id-type="medline">21124761</pub-id>
          <pub-id pub-id-type="pmcid">PMC2993925</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Teng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Dynamic forecasting of Zika epidemics using Google Trends</article-title>
          <source>PLoS One</source>
          <year>2017</year>
          <month>1</month>
          <day>6</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>e0165085</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0165085"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0165085</pub-id>
          <pub-id pub-id-type="medline">28060809</pub-id>
          <pub-id pub-id-type="pii">PONE-D-16-40369</pub-id>
          <pub-id pub-id-type="pmcid">PMC5217860</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cervellin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Comelli</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lippi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Is Google Trends a reliable tool for digital epidemiology? Insights from different clinical settings</article-title>
          <source>J Epidemiol Glob Health</source>
          <year>2017</year>
          <month>09</month>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>185</fpage>
          <lpage>189</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2210-6006(17)30109-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jegh.2017.06.001</pub-id>
          <pub-id pub-id-type="medline">28756828</pub-id>
          <pub-id pub-id-type="pii">S2210-6006(17)30109-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7320449</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
