<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id>
      <journal-title>JMIR Infodemiology</journal-title>
      <issn pub-type="epub">2564-1891</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v2i2e35121</article-id>
      <article-id pub-id-type="pmid">36348981</article-id>
      <article-id pub-id-type="doi">10.2196/35121</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Quantifying Changes in Vaccine Coverage in Mainstream Media as a Result of the COVID-19 Outbreak: Text Mining Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mackey</surname>
            <given-names>Tim</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Williams</surname>
            <given-names>Christopher</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Luo</surname>
            <given-names>Jiebo</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Christensen</surname>
            <given-names>Bente</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2013-3559</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Laydon</surname>
            <given-names>Daniel</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4270-3321</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Chelkowski</surname>
            <given-names>Tadeusz</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0297-3650</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Jemielniak</surname>
            <given-names>Dariusz</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3745-7931</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Vollmer</surname>
            <given-names>Michaela</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6970-7192</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Bhatt</surname>
            <given-names>Samir</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0891-4611</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Krawczyk</surname>
            <given-names>Konrad</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Mathematics and Computer Science</institution>
            <institution>University of Southern Denmark</institution>
            <addr-line>Campusvej 55</addr-line>
            <addr-line>Odense, 5230</addr-line>
            <country>Denmark</country>
            <phone>45 5551122</phone>
            <email>konradk@imada.sdu.dk</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0697-5522</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Mathematics and Computer Science</institution>
        <institution>University of Southern Denmark</institution>
        <addr-line>Odense</addr-line>
        <country>Denmark</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Infectious Disease Epidemiology</institution>
        <institution>MRC Centre for Global Infectious Disease Analysis</institution>
        <institution>Imperial College London</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Management in the Network Society</institution>
        <institution>Kozminski University</institution>
        <addr-line>Warsaw</addr-line>
        <country>Poland</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Section of Epidemiology</institution>
        <institution>Department of Public Health</institution>
        <institution>University of Copenhagen</institution>
        <addr-line>Copenhagen</addr-line>
        <country>Denmark</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Konrad Krawczyk <email>konradk@imada.sdu.dk</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jul-Dec</season>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>20</day>
        <month>9</month>
        <year>2022</year>
      </pub-date>
      <volume>2</volume>
      <issue>2</issue>
      <elocation-id>e35121</elocation-id>
      <history>
        <date date-type="received">
          <day>22</day>
          <month>11</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>30</day>
          <month>12</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>25</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>7</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Bente Christensen, Daniel Laydon, Tadeusz Chelkowski, Dariusz Jemielniak, Michaela Vollmer, Samir Bhatt, Konrad Krawczyk. Originally published in JMIR Infodemiology (https://infodemiology.jmir.org), 20.09.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on https://infodemiology.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://infodemiology.jmir.org/2022/2/e35121" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Achieving herd immunity through vaccination depends upon the public’s acceptance, which in turn relies on their understanding of its risks and benefits. The fundamental objective of public health messaging on vaccines is therefore the clear communication of often complex information and, increasingly, the countering of misinformation. The primary outlet shaping public understanding is mainstream online news media, where coverage of COVID-19 vaccines was widespread.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We used text-mining analysis on the front pages of mainstream online news to quantify the volume and sentiment polarization of vaccine coverage.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We analyzed 28 million articles from 172 major news sources across 11 countries between July 2015 and April 2021. We employed keyword-based frequency analysis to estimate the proportion of overall articles devoted to vaccines. We performed topic detection using BERTopic and named entity recognition to identify the leading subjects and actors mentioned in the context of vaccines. We used the Vader Python module to perform sentiment polarization quantification of all collated English-language articles.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The proportion of front-page articles mentioning vaccines increased from 0.1% to 4% with the outbreak of COVID-19. The number of negatively polarized articles increased from 6698 in 2015-2019 to 28,552 in 2020-2021. However, overall vaccine coverage before the COVID-19 pandemic was slightly negatively polarized (57% negative), whereas coverage during the pandemic was positively polarized (38% negative).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Throughout the pandemic, vaccines have risen from a marginal to a widely discussed topic on the front pages of major news outlets. Mainstream online media has been positively polarized toward vaccines, compared with mainly negative prepandemic vaccine news. However, the pandemic was accompanied by an order-of-magnitude increase in vaccine news that, due to low prepandemic frequency, may contribute to a perceived negative sentiment. These results highlight important interactions between the volume of news and overall polarization. To the best of our knowledge, our work is the first systematic text mining study of front-page vaccine news headlines in the context of COVID-19.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>data mining</kwd>
        <kwd>COVID-19</kwd>
        <kwd>vaccine</kwd>
        <kwd>text mining</kwd>
        <kwd>change</kwd>
        <kwd>coverage</kwd>
        <kwd>communication</kwd>
        <kwd>media</kwd>
        <kwd>social media</kwd>
        <kwd>news</kwd>
        <kwd>outbreak</kwd>
        <kwd>acceptance</kwd>
        <kwd>hesitancy</kwd>
        <kwd>understanding</kwd>
        <kwd>knowledge</kwd>
        <kwd>sentiment</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Theoretical models suggest that the herd immunity threshold for SARS-CoV-2 requires at least two-thirds of the population to be immunized through either natural infection or vaccination [<xref ref-type="bibr" rid="ref1">1</xref>]. Though multiple safe and effective vaccines have been developed [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>], one significant challenge in achieving pandemic control is “vaccine hesitancy,” which ranges from mistrust to outright refusal of vaccination [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      <p>Vaccine hesitancy extends beyond COVID-19 and is 1 of the 10 biggest threats to global health according to the World Health Organization (WHO). At its core, vaccine hesitancy is an issue of perception, rooted in the information individuals receive [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Social media is an important source of both vaccine information and misinformation. Although vaccine-related tweets are predominantly positively polarized [<xref ref-type="bibr" rid="ref7">7</xref>], there is also substantial (possibly coordinated) misinformation [<xref ref-type="bibr" rid="ref8">8</xref>] that contributes to vaccine hesitancy [<xref ref-type="bibr" rid="ref9">9</xref>]. Further, the volume of tweeted fake news within a given country negatively correlates with its vaccine uptake [<xref ref-type="bibr" rid="ref10">10</xref>]. Antivaccination supporters on Twitter share more conspiracy theories and make greater use of emotional language than provaccination supporters [<xref ref-type="bibr" rid="ref11">11</xref>]. Moreover, vaccine discourse is highly politicized [<xref ref-type="bibr" rid="ref12">12</xref>], and the likelihood of endorsing misinformation is ideologically driven [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      <p>Different sides of vaccine discourse prioritize different objective values: Arguments in favor of vaccines prioritize community, while arguments against vaccines focus on individual freedom [<xref ref-type="bibr" rid="ref15">15</xref>]. A high proportion of parents' opinions on vaccines expressed online is aggressive, accusatory, or inaccurate [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      <p>Major news outlets also play an important role in vaccine discourse [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Although several text mining studies have covered vaccines within specific regions [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>], to the best of our knowledge, there are no large-scale text mining studies to date of vaccine front-page news headlines that encompass multiple countries focusing specifically on COVID-19.</p>
      <p>Here, we analyzed online news media coverage of COVID-19 vaccines. We used text mining analysis to estimate the volume of online vaccine news coverage during 3 time periods: (1) before the COVID-19 pandemic, (2) before the COVID-19 vaccine announcement, and (3) after the COVID-19 vaccine announcement. We used ~28 million front-page headlines collected from 11 different countries with a healthy online news media ecosystem, defined using SimilarWeb traffic and BBC media profiles [<xref ref-type="bibr" rid="ref23">23</xref>]. Because sentiment toward vaccines is influenced by the context in which they are mentioned, the most frequently mentioned topics were gathered alongside the most frequently mentioned companies and organizations. Our analysis aimed to inform future public health and vaccine communication, with a view to hopefully reducing vaccine hesitancy.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Curation of a Front-page News Article Database</title>
        <p>We analyzed the landing pages from major online news sources (ONSs) in countries with a healthy media ecosystem. The data are fully described in a previous study [<xref ref-type="bibr" rid="ref23">23</xref>] that focused on front-page news from 172 leading ONSs in 11 countries (Australia, Canada, France, Germany, Ireland, Italy, New Zealand, Russia, Spain, the United Kingdom, the United States) and an international category. The international category contained headlines from ONSs that were internationally distributed (eg, EuroNews or AlJazeera). The data used articles published from July 2015 to April 2021, which covered the following 3 time periods: (1) before the outbreak of COVID-19, (2) during the pandemic before the COVID-19 vaccine announcement, and (3) during the pandemic after the COVID-19 vaccine announcement. We took November 2020 as the cutoff date for the COVID-19 vaccine announcement, as from this point on, the press started covering SARS-CoV-2 vaccines following the announcement by BioNTech and Pfizer. We note this date applies to western countries, which are the subject of our study, and is less applicable globally. The updated data set included a total of 28,709,060 headlines, from which 14,638,278 were in the English language and 14,070,782 were in a language other than English.</p>
      </sec>
      <sec>
        <title>Identifying Vaccine Headlines</title>
        <p>Keywords were used to identify whether a given headline was vaccine-related. For non-English headlines, keywords were supplied by native speakers. For English headlines, we supplied the keywords ourselves. The keywords used can be found in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <p>Non-English headlines were stemmed using SnowballStemmer [<xref ref-type="bibr" rid="ref24">24</xref>] and case-folded (<xref ref-type="table" rid="table1">Table 1</xref>) to capture the equivalence class of different forms of words (eg, the German words Impfung, impfen, Impfgegner all map to impf). English headlines were lemmatized using TreeTagger [<xref ref-type="bibr" rid="ref25">25</xref>], all words were case-folded, and punctuation was removed, whereby words connected by a hyphen were separated into 2 words. English headlines were lemmatized to avoid misclassifications (eg “immunity” understood in a legal rather than a biomedical sense).</p>
        <p>The techniques used to identify vaccine headlines varied by language, and we used the same methodology as in our previous work [<xref ref-type="bibr" rid="ref23">23</xref>]. In French, Italian, Russian, and Spanish, titles and descriptions were tokenized, and if either the title or the description contained at least one keyword, the headline was labeled as a vaccine headline. In English and German, titles and descriptions were kept as strings, and a search was performed for keyword patterns. If a keyword pattern was present, the headline was designated as a vaccine headline (eg, in German, the prefix Impf-). Machine learning translation offers an alternative way to identify vaccine headlines across languages; however, this was beyond the scope of this work.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Keywords used to identify the vaccine headlines.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Language</td>
                <td>Keywords</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>English<break/>  <break/>  </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>vaccin</p>
                    </list-item>
                    <list-item>
                      <p>immunis</p>
                    </list-item>
                    <list-item>
                      <p>immuniz</p>
                    </list-item>
                    <list-item>
                      <p>anti vax</p>
                    </list-item>
                    <list-item>
                      <p>antivax</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>French</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>vaccin</p>
                    </list-item>
                    <list-item>
                      <p>antivaccin</p>
                    </list-item>
                    <list-item>
                      <p>immunis</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>German</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>impf</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Italian</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>vaccin</p>
                    </list-item>
                    <list-item>
                      <p>antivaccin</p>
                    </list-item>
                    <list-item>
                      <p>immunizz</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Russian</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>прививк</p>
                    </list-item>
                    <list-item>
                      <p>привива</p>
                    </list-item>
                    <list-item>
                      <p>вакцин</p>
                    </list-item>
                    <list-item>
                      <p>иммунизац</p>
                    </list-item>
                    <list-item>
                      <p>вакцинац</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Spanish</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>vacun</p>
                    </list-item>
                    <list-item>
                      <p>antivacun</p>
                    </list-item>
                    <list-item>
                      <p>inmuniz</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Splitting the Data Into 3 Vaccination-Specific Periods</title>
        <p>We divided the data into 3 time periods: (1) the pre-COVID-19 era, (2) during the pandemic before the COVID-19 vaccine announcement, and (3) during the pandemic after the COVID-19 vaccine announcement. This division of the data was based on clear changes within media coverage with respect to vaccines and COVID-19. On January 9, 2020, daily media coverage of the coronavirus began, so we chose this date as the end of the pre-COVID-19 era. We chose November 9, 2020, as the cut-off date separating the prevaccine and after-vaccine announcements. This resulted in the following 3 periods:</p>
        <list list-type="order">
          <list-item>
            <p>Before COVID-19: July 2015 to January 8, 2020</p>
          </list-item>
          <list-item>
            <p>Before the COVID-19 vaccine announcement: January 9, 2020, to November 9, 2020</p>
          </list-item>
          <list-item>
            <p>After the COVID-19 vaccine announcement: November 10, 2020, to April 2, 2021</p>
          </list-item>
        </list>
        <p>To identify changes in each period, the relative frequency of vaccines mentioned in the full data set, along with the relative frequency of headlines containing either “COVID-19” or “coronavirus,” was calculated at weekly intervals using equation 1.</p>
        <disp-formula>
          <graphic xlink:href="infodemiology_v2i2e35121_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where |<italic>ONS<sub>Topic,Week</sub></italic>| is the number of headlines on a particular topic in a given week and |<italic>ONS<sub>Week</sub></italic>| is the number of headlines in that same given week. The relative frequency was calculated first with respect to vaccines, where all vaccine-related headlines were included, and second with respect to COVID-19, where all headlines containing either the keyword “coronavirus” or “COVID-19” were included.</p>
      </sec>
      <sec>
        <title>Topic Detection of the Vaccine Headlines in the 3 Periods Using BERTopic</title>
        <p>Topics were identified for 91 English ONSs using BERTopic. Topics were not identified for the non-English ONSs, as finding the optimal number of topics within non-English ONSs would require languages to be handled separately and would also require in-depth knowledge about each language. BERTopic is a topic modelling technique that uses a combination of transformers and c-TF-IDF to create dense clusters using HDBSCAN, where c-TF-IDF is a class-based TF-IDF that can be used to generate features from text [<xref ref-type="bibr" rid="ref26">26</xref>]. We chose to use BERTopic as it was previously successful in heterogeneous text mining [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>] and it offers multiple pretrained models. Additionally, scatterplots of the embeddings of the data from the 3 periods did not show a clear clustering of the headlines, which rules out several other topic detection techniques (please see Figures S1-S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>To remove patterns from the text input to BERTopic that could otherwise affect the model, all abbreviations, links, and names referring to the different newspapers were removed. Additionally, the word “news” was removed, along with words containing “immuniz,” “immunis,” and “vaccin,” which were used to extract the vaccine headlines. The phrases “anti vax” and “antivax” were retained, as they refer to resistance toward vaccination.</p>
        <p>Text input to BERTopic was normalized to reduce word variation. The headlines were lemmatized using TreeTagger combined with case-folding. TreeTagger is a tool for annotating text with part-of-speech and lemma information using a Markow tagger, which uses a decision tree to obtain reliable estimates. TreeTagger was also used to remove filler words from headlines by only using words tagged as either a noun (including proper nouns), verb, or adjective and removing words that contained little information about topics.</p>
        <p>We employed a 2-step evaluation method to identify the number of clusters reflecting the most common topics (Section 1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The pseudocode for this is illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref>. Evaluating topic similarity (step 2) was performed manually, as 2 topics might deal with the same subject but contain several seemingly different keywords or word combinations, which would make the model split them into 2 topics instead of 1 topic. Therefore, the decision of how to continue from step 2 was likewise done manually.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Pseudocode for the 2-step evaluation method to identify the number of clusters reflecting the most common topics.</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Named Entity Recognition of Vaccine Headlines Using SpaCy</title>
        <p>Named entity recognition (NER) identifies and categorizes words (or strings of words) for an entity, where an entity can be the name of a person, organization, location, or work of art. We used NER to determine the companies and organizations that were mentioned frequently in the context of vaccination. NER was performed on both English and non-English data using SpaCy with different pipelines depending on the language. SpaCy is an advanced natural language processing tool that is able to perform NER on multiple different languages using statistical models. Therefore, it uses previous training and predictions to decide whether a word or collection of words is a named entity and which kind of entity it most likely is [<xref ref-type="bibr" rid="ref29">29</xref>]. Pipelines were chosen according to the reported accuracy by SpaCy. In all cases, the most accurate pipeline was used, which were en_core_web_trf, de_core_news_lg, fr_core_news_lg, it_core_news_lg, ru_core_news_lg, and es_core_news_lg. The 2 first letters in each pipeline refer to the language for which it was trained.</p>
        <p>Entities such as “AstraZeneca-Oxford” or “Pfizer-BioNTech” were split to count as separate entities. The occurrences of “Johnson and Johnson” and “J&amp;J” were altered to “Johnson &amp; Johnson.”</p>
        <p>Individual entities were enumerated using case-folded entities. We created 2 bar plots (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), one containing the 30 most frequently occurring named entities from English ONSs and another containing the 30 most frequently named entities from non-English ONSs.</p>
      </sec>
      <sec>
        <title>Frequent N-grams With Respect to the Different Vaccine Manufacturers</title>
        <p>Changes in sentiment toward vaccination before and after the COVID-19 vaccine announcement were determined by assessing 7 frequently occurring vaccine manufacturers found using NER. A data set containing English headlines for each vaccine manufacturer was created, which was then assessed with respect to frequent bigrams and trigrams (referred to as n-grams henceforth). The lemmatized headlines created for the topic detection were used for this purpose.</p>
        <p>For all vaccines and periods, the 50 most frequent n-grams were assessed. In some cases, a combination of 2 bigrams, with almost the same count as a trigram, would combine to give that trigram. For instance, the bigrams (<italic>food, drug</italic>) and (<italic>drug, administr</italic>) combined give the trigram (<italic>food drug administr</italic>). This was caused by “Food and Drug Administration” in some cases being referred to as “Food and Drug Authority” or “Food and Drug Association.” Such bigrams were removed, keeping only the trigrams. Similar bigrams were excluded for “Food and Drug Administration,” “Centers for Disease Control,” and “European Medicines Agency.” Additionally, “FDA,” “CDC,” “NIH,” “WHO,” and “EMA” were commonly occurring abbreviations among the frequent words with respect to some vaccines, which were added to the number of occurrences of “Food and Drug Administration,” “Center for Disease Control,” “National Institute of Health,” “World Health Organization,” and “European Medicines Authority,” respectively. Other abbreviations such as “NHS,” “HHS,” and “PHE” were assessed with respect to frequent bigrams and trigrams. Likewise, if bigrams occurred the same number of times as a trigram containing the bigram, the bigram was removed.</p>
      </sec>
      <sec>
        <title>Sentiment Analysis of the Vaccine Headlines of 3 Periods Using VADER</title>
        <p>We performed sentiment analysis on English-language headlines using VADER [<xref ref-type="bibr" rid="ref30">30</xref>]. Before assessing sentiment values, each headline’s raw score was calculated using the positive and negative sentiment values in equation 2:</p>
        <disp-formula><italic>Raw<sub>score</sub></italic>=<italic>Positive<sub>score</sub></italic> - <italic>Negative<sub>score</sub></italic> <bold>(2)</bold></disp-formula>
        <p>The extent of negative or positive sentiment polarization varied between ONSs and over time. Therefore, a comparison of sentiment toward vaccines between the periods and ONSs on the raw sentiment values would not show whether a change in sentiment toward vaccines was due to an overall change in sentiment or, instead, due to a change in sentiment specifically toward vaccines. Therefore, to enable comparison of the periods and between the ONSs, each sentiment value for a vaccine headline was adjusted according to the overall average sentiment in the given ONS. The adjustment was done using the VADER sentiment values (either raw or compound, denoted by <italic>S<sub>ONS,Topic,Period</sub></italic>), subtracting the mean sentiment value for the same ONS, with respect to nonvaccine headlines in the same period (either raw or compound, denoted by <inline-graphic xlink:href="infodemiology_v2i2e35121_fig10.png" xlink:type="simple" mimetype="image"/>).</p>
        <p>This is referred to as the relative sentiment skew (RSS) and is given in equation 3:</p>
        <disp-formula>
          <graphic xlink:href="infodemiology_v2i2e35121_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where <italic>ONS<sub>Topic,Period</sub></italic> is the collection of headlines of a given topic for a given ONS in a specific period, <inline-graphic xlink:href="infodemiology_v2i2e35121_fig12.png" xlink:type="simple" mimetype="image"/> is the collection of headlines not pertaining to that topic for that same ONS in all periods, <italic>h</italic> is a single headline, and <italic>sent(h)</italic> is the sentiment value of h, while <inline-graphic xlink:href="infodemiology_v2i2e35121_fig13.png" xlink:type="simple" mimetype="image"/> is the number of headlines not in the given topic for that same ONS in all periods. In this case, the topic in equation 3 is vaccines. The raw scores were used to RSS each headline, with respect to the 3 periods. These were illustrated in line plots, in which the cumulative frequency showed the proportion of negative and positive RSS values of a certain smaller value. Because of the nuanced nature of the news, we applied the same manual checks here as in our previous work to make sure sentiment annotations were correct [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>Of the 14,638,278 English-language headlines identified over all 3 data periods, 83,395 (0.6%) were found to be vaccine-related using the keywords defined in <xref ref-type="table" rid="table1">Table 1</xref>. Dividing these with respect to the 3 periods gave the following number of vaccine headlines within each period: (1) before COVID-19: 11,361; (2) before the COVID-19 vaccine announcement: 17,112; (3) after the COVID-19 vaccine announcement: 54,922.</p>
      <sec>
        <title>Large Increase in Ratio of Vaccine Headlines With the Rollout of COVID-19 Vaccines</title>
        <p>We calculated the percentage of vaccine coverage within newspaper headlines for each week within each time period of data collection, plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>. Before the pandemic, the percentage of vaccine headlines was low (0.1% across 172 ONSs). With the COVID-19 outbreak in early 2020, the proportion of vaccine headlines increased to an average of 4%.</p>
        <p>Increased reporting on vaccines during the second period coincided with the advent of COVID-19 reporting. The 10 most common topics in vaccine coverage in the 3 periods are shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. Causal connections cannot be established, as the COVID-19 coverage reached one-quarter of all front-page coverage with nuanced associations with reported topics [<xref ref-type="bibr" rid="ref23">23</xref>]. Unsurprisingly, the most common vaccine-related topics during the second and third time periods were related to the pandemic. Although COVID-19 increased vaccine news coverage, coverage of COVID-19 was not directly correlated with that of vaccine coverage (<xref rid="figure2" ref-type="fig">Figure 2</xref>).</p>
        <p>Rather than dropping to a stable level, as COVID-19 headlines did (<xref rid="figure2" ref-type="fig">Figure 2</xref>), the proportion of vaccine headlines increased from week 45 to week 47 of 2020 to between 6% and 8% and remained at this level until April 2, 2021. This increase is linked to the Pfizer and BioNTech press release on November 9, 2020, which reported 90% effectiveness in preventing COVID-19, paving the way for the rollout in the United Kingdom beginning on December 2, 2020.</p>
        <p>Relative frequencies of vaccine headlines were calculated for each period and each country (<xref rid="figure4" ref-type="fig">Figure 4</xref>). Relative frequencies for each country were similar, with very limited attention toward vaccines before the pandemic and a steep rise after the introduction of the first SARS-CoV-2 vaccine.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Percentage of headlines mentioning (A) vaccines and (B) "COVID-19" or "coronavirus" in the mainstream media over time, with the first and second cut-off dates (dotted and dashed vertical lines, respectively).</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The 10 most common topics within vaccine-related articles during the 3 time periods. Purple cells highlight topics directly related to COVID-19, while red cells highlight topics that occur during more than one period. Notice that “Russia and COVID-19” is colored purple even though it occurs in multiple periods. EU: European Union; HPV: human papillomavirus.</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Relative vaccine frequency for each country including the international online news sources for each of the 3 periods: (A) before COVID-19, (B) before the COVID-19 vaccine announcement, and (C) after the COVID-19 vaccine announcement.</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Majority of Vaccine Reporting Had Positive Sentiment Polarization With the Outbreak of COVID-19 as Opposed to the Prepandemic Era</title>
        <p><xref rid="figure5" ref-type="fig">Figure 5</xref> shows the VADER sentiment scores for vaccine-associated headlines within each time period. The increased frequency of vaccine reporting during the pandemic led to an increase in the absolute number of negatively polarized articles, from 6698 in 2015-2019 to 28,552 in 2020-2021. Overall, however, polarization during the pandemic was majority positive (38% negatively polarized) as opposed to the prepandemic period, when 57% of articles were negatively polarized. <xref rid="figure3" ref-type="fig">Figure 3</xref> suggests that the difference in sentiment between pre-COVID-19 and post-COVID-19 vaccine coverage could be associated with COVID-19 coverage. This could be because COVID-19 became the dominant topic globally, accounting for one-quarter of all news during the pandemic.</p>
        <p>To investigate the difference in sentiment distribution between the 2 periods during the pandemic, we contrasted the topics and named entities mentioned in both periods. The period “Before the COVID-19 vaccine announcement” can largely be interpreted as the period in which all vaccines were under development, while “After the COVID-19 vaccine announcement” is the period in which some vaccines were rolled out and others were still under development. Although there is a difference between the periods before COVID-19 and after COVID-19, there was not a sizable sentiment discrepancy between the 2 periods during the pandemic (<xref rid="figure5" ref-type="fig">Figure 5</xref>).</p>
        <p>We further investigated the topic polarization of the articles relating to the COVID-19 vaccine development and rollout. We extracted articles associated with 2 topics from <xref rid="figure3" ref-type="fig">Figure 3</xref>: “Vaccine development” and “Vaccine rollout.” One could argue that “Vaccine production” (topic 10) should be merged with “Vaccine rollout” in line with our interpretation of the periods. However, we wanted to avoid manual intervention in topic annotations. The individual articles were extracted from the data giving 2 data sets of approximately the same size (846 and 814 headlines, respectively).</p>
        <p>We assessed sentiment polarization of the topics “Vaccine development” and “Vaccine rollout.” RSS of raw VADER sentiment for “Vaccine development” and “Vaccine rollout” is illustrated in <xref rid="figure6" ref-type="fig">Figure 6</xref>, which shows a change in vaccine sentiment between the development and trial phase and the rollout of the vaccines. <xref rid="figure6" ref-type="fig">Figure 6</xref> illustrates that, for “Vaccine development,” sentiment is overwhelmingly positive, with almost the entire interquartile range above the zero line. Of the headlines in “Vaccine development,” 23% had negative RSS, while 77% had positive RSS. This is very different from “Vaccine rollout,” for which 66% had negative RSS and only 34% had positive RSS. Additionally, the widest area lies above zero for “Vaccine development” and below zero for “Vaccine rollout.” Therefore, the RSS with the highest frequency is positive for “Vaccine development” and negative for “Vaccine rollout.” The largest and smallest RSS for the 2 topics are quite different: “Vaccine Development” lies in the range from –0.3 to just below 0.5, while “Vaccine rollout” lies in the range from –0.5 to 0.3; so, their RSS values are equally spread, but their ranges are differently situated. This suggests that the difference in sentiment distributions between the 2 COVID-19 periods could be attributed to more negative coverage during vaccine rollout.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Relative sentiment skew (y axis) of vaccine coverage in the 3 periods used in this study.</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Relative sentiment skew for the topics "Vaccine development" and "Vaccine rollout" using the raw sentiment value.</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Most Common Organizations Mentioned in the Context of COVID-19 Vaccines and Sentiment Toward Them</title>
        <p>To gain more granular insight into sentiment polarization during the pandemic period, we investigated the top entities mentioned. We employed SpaCy to perform NER, and the 30 most frequently mentioned companies or organizations for all 3 periods are illustrated in <xref rid="figure7" ref-type="fig">Figure 7</xref>.</p>
        <p>Unsurprisingly, the most common associations were between well-known COVID-19 vaccine manufacturers, namely “AstraZeneca” (in collaboration with Oxford), “Pfizer” (in collaboration with BioNTech), “BioNTech,” “Moderna,” “Oxford,”, “Johnson &amp; Johnson,” and “Sputnik V.” Though AstraZeneca and Oxford, as well as Pfizer and BioNTech, developed their vaccines as a partnership, they were frequently mentioned separately; thus, we opted to keep them as separate entities.</p>
        <p>Of the 30 most frequent named entities, in both English and non-English headlines, 16 occurred in both data sets, colored green in <xref rid="figure7" ref-type="fig">Figure 7</xref>. The nonoverlapping entities were mainly attributed to national organizations or companies. For instance, “NHS” and “HHS” are the National Health Service and the Department of Health and Human Services from the United Kingdom and United States, respectively, and were solely found among the 30 most frequent English entities. “Rospotrebnadzor” is the Federal Service for Surveillance on Consumer Rights in Russia, and “RDIF” and “PAH” are also Russian and were found solely among the 30 most frequent non-English entities. Additionally, company names are the same across different languages, whereas some national organizations are not; for instance, the abbreviation for the World Health Organization is WHO in English, while in French, it is OMS.</p>
        <p>The frequency at which vaccine manufacturers were mentioned within all news headlines increased from almost zero before COVID-19 to most frequently mentioned within the period after the vaccine announcement (<xref ref-type="table" rid="table2">Table 2</xref>). Therefore, vaccine manufacturers were assessed only within the COVID-19 pandemic.</p>
        <p>The most common associations with vaccine manufacturers indicated progress in development and rollout and were health-related (eg, side effects). Detailed analysis of the n-grams for each vaccine developer are in Section 2 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Vaccines by Moderna and Pfizer were chiefly associated with n-grams indicating progress of clinical trials and their rollouts. By contrast, top n-grams associated with AstraZeneca and Johnson &amp; Johnson were linked to side effect reporting (eg, unexplained illness, blood clot). Throughout the pandemic, Sputnik V was mentioned not in a medical context but rather frequently linked to Russia and Vladimir Putin, containing frequent n-grams like <italic>“</italic>Soviet Union,” “President Vladimir Putin,” and “Russia Soviet Union.”</p>
        <p>We investigated the extent to which the difference in the context of vaccine manufacturers influenced news article sentiment. In <xref rid="figure8" ref-type="fig">Figure 8</xref>, we plotted the proportion of negative and positive sentiments toward the vaccine manufacturer entities before and after the vaccine announcement. In the period before the COVID-19 vaccine announcement, entities appear to have similar negative polarizations, AstraZeneca and Johnson &amp; Johnson being noted as slight outliers with more negative coverage. After the COVID-19 vaccine announcement, AstraZeneca had a notably higher ratio of negative articles and a lower ratio of positive articles. Despite Johnson &amp; Johnson being associated with side effects (as per our n-gram analysis), AstraZeneca received notably worse press. We removed AstraZeneca coverage from <xref rid="figure5" ref-type="fig">Figure 5</xref> and <xref rid="figure6" ref-type="fig">Figure 6</xref> to test whether the higher associated volume of negative news influenced the slightly more negative polarization in the phase after the COVID-19 vaccine announcement. In both cases, we did not find that AstraZeneca was the main driver in more negatively polarized articles in that period (please see Tables S1 and S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>The 30 most frequent entities (companies and organizations) found in the (A) English and (B) non-English data. The green names are the organizations and companies that were found in both English and non-English data.</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The 21 different subsets created with respect to the different vaccines and periods, including the number of times each of the different manufacturers were mentioned within the news headlines in each subset (7 vaccine manufacturers in 3 periods).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="180"/>
            <col width="180"/>
            <col width="340"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td>Manufacturer</td>
                <td>Before COVID-19</td>
                <td>Before the COVID-19 vaccine announcement</td>
                <td>After the COVID-19 vaccine announcement</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>AstraZeneca</td>
                <td>3</td>
                <td>747</td>
                <td>5134</td>
              </tr>
              <tr valign="top">
                <td>BioNTech</td>
                <td>1</td>
                <td>163</td>
                <td>2118</td>
              </tr>
              <tr valign="top">
                <td>Johnson &amp; Johnson</td>
                <td>17</td>
                <td>332</td>
                <td>1050</td>
              </tr>
              <tr valign="top">
                <td>Moderna</td>
                <td>3</td>
                <td>647</td>
                <td>2256</td>
              </tr>
              <tr valign="top">
                <td>Oxford</td>
                <td>3</td>
                <td>1010</td>
                <td>2288</td>
              </tr>
              <tr valign="top">
                <td>Pfizer</td>
                <td>27</td>
                <td>513</td>
                <td>6042</td>
              </tr>
              <tr valign="top">
                <td>Sputnik V</td>
                <td>0</td>
                <td>153</td>
                <td>700</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Proportion of negative and positive sentiment polarization with respect to entities associated with vaccine manufacturing in the periods “Before the COVID-19 vaccine announcement” and “After the COVID-19 vaccine announcement”: (A) negative sentiment skew "Before the COVID-19 vaccine announcement," (B) positive sentiment skew "Before the COVID-19 vaccine announcement," (C) negative sentiment skew "After the COVID-19 vaccine announcement," (D) positive sentiment skew "Before the COVID-19 vaccine announcement".</p>
          </caption>
          <graphic xlink:href="infodemiology_v2i2e35121_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>We used text mining to study vaccine reporting on the front pages of top national news outlets. We demonstrated that reporting on vaccines increased in volume from coverage of around 0.1% on front pages to almost 4% of all headlines during the pandemic. Despite reporting covering the vaccines’ side effects, overall coverage can be classified as positive, in line with previous studies of social media that reported positive polarization of vaccine-related tweets [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>The news ecosystem accounts for 76% of the information people consume [<xref ref-type="bibr" rid="ref31">31</xref>], which can affect people’s behavior, for instance making them more hesitant toward vaccines. This can be exacerbated by circulation of misinformation [<xref ref-type="bibr" rid="ref21">21</xref>] and by vaccine reporting along partisan lines [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>However, news is only one facet of the entire media ecosystem, and much information is communicated via social media [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. Social media encourages active participation in the form of clicks, likes, retweets, and shares, which are then readily quantifiable by engagement. With news however, the engagement is much more nuanced, especially because of more passive information consumption when people merely scan headlines. Nonetheless, traditional news is still vital in forming opinions and, in many cases, constitutes the initial discourse on other platforms.</p>
      <p>We focused on analyzing headlines from a handful of western countries to provide a data-centric analysis of vaccine coverage across several countries. Similar studies have been conducted in individual countries (eg, Brazil [<xref ref-type="bibr" rid="ref22">22</xref>]) or other regions (eg, Africa [<xref ref-type="bibr" rid="ref20">20</xref>]). Our study encompasses countries that were among the first to manufacture and introduce the vaccine on a large scale (United States, Russia, Germany, United Kingdom). In these countries, policy makers had to navigate vaccine hesitancy and ongoing COVID-19 restrictions with sophisticated media coverage throughout the development and rollout phases.</p>
      <p>We analyzed how front-page headline vaccine reporting evolved during the COVID-19 pandemic. For the analysis, we made a set of assumptions that are associated with certain limitations. Our focus on the headlines in predominantly developed western countries underrepresents the situation faced in other parts of the world that were also affected by COVID-19, where vaccine hesitancy is compounded by inequality in vaccine manufacturing and distribution [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. We justify using headline information by virtue of normalizing heterogeneous long-form texts across different news sites and by capturing the behavior of passive scanning of headlines. However, this introduces a disconnect between the information in the full article that might not be reflected in an attention-attracting headline and thus leads to different information consumption by the reader. Within our data set, we opted for a keyword-based approach that was previously used to measure the extent of COVID-19 reporting [<xref ref-type="bibr" rid="ref23">23</xref>]. The approach is designed to increase the precision of identified headlines, though at the expense of recall. For instance, the headline “UK measles outbreak: 500,000 British children don’t have crucial jab - Daily Star. MORE than half a million children in the UK didn’t receive a…” was not extracted for the English vaccine data set, as it does not contain any of the chosen key words given in <xref ref-type="table" rid="table1">Table 1</xref>, even though it clearly pertains to vaccination. Developing a more complex topic model would not guarantee better performance and comparability between different languages, as one would have to develop a suitable model that captures the same linguistic nuances. Therefore, we resorted to simple mentions of basic vaccine-derived keywords to aid comparison across countries.</p>
      <p>Even though this approach underestimates the number of vaccine-related articles, COVID-19 vaccine reporting was still given central prominence, unlike before the outbreak when vaccines were covered only sporadically. Studying the volume of vaccine coverage motivated our division of the data into the 3 periods, before COVID-19, during COVID-19 but before the vaccines, and with COVID-19 vaccines. It is possible that our definitions of the second and third periods could have influenced our results. However, we found it reasonable to make these divisions according to the large rise in the relative frequency in vaccine headlines due to the Pfizer and BioNTech press release on November 9, 2020. This press release influenced all countries, while many of the other cornerstones in this period were more country-specific. For instance, the United Kingdom was the first country to approve the Pfizer-BioNTech vaccine on December 2, 2020, with the United States Food and Drug Administration approval of the Pfizer-BioNTech vaccine occurring on December 11, 2020.</p>
      <p>Our topic modelling and sentiment analysis showed that COVID-19 increased the proportion of vaccine headlines by more than an order of magnitude, from a negligible 0.1% to a formidable 4% during vaccine rollout across 172 ONSs. Reporting on vaccines prior to COVID-19 was negatively polarized. By contrast, vaccine-related reporting during the pandemic is positively polarized. Though we note a discrepancy in sentiment polarization pre- and post-COVID-19, this could be attributed to sampling bias post-COVID-19, as there was significantly more vaccine coverage. Moreover, sentiment polarization in the headlines might not relate directly to vaccines but rather to tangential topics. We therefore also analyzed the tendences in sentiments relating to specific concepts or entities, such as vaccine development or vaccine manufacturers.</p>
      <p>We performed in-depth sentiment analysis of the subtopic AstraZeneca, which received more negative coverage because of widely reported side effects and delivery issues. According to our analysis, however, such negative reporting was not significant enough to alter the overall positive narrative of vaccines in the news. Although The University of Oxford co-created the vaccine, it does not experience an equally large proportion of negative headlines as does AstraZeneca, which might be reflected in the media coverage frequency of the 2 with respect to vaccines. Although AstraZeneca is mentioned 5881 times during the pandemic, Oxford is mentioned 3298 times, mostly in the period before the COVID-19 vaccine announcement, while for AstraZeneca the majority is in the subsequent period. Therefore, AstraZeneca is more frequently connected with the vaccine in the media coverage than Oxford.</p>
      <p>Our findings study the online news media’s vaccine coverage and are also applicable more widely to general mistrust of authority and science. Although direct connections between news coverage and vaccine uptake are beyond the scope of this study, we have comprehensively characterized sentiment toward COVID-19 vaccination in the online news media. Future survey-based studies into vaccine hesitancy will hopefully benefit from our work, as it details the changing information landscape on which the public ultimately base their decisions. Our work is therefore also important for public health policy makers who require knowledge of the information that the public consumes when designing vaccine mandates.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary information.</p>
        <media xlink:href="infodemiology_v2i2e35121_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 1476 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">NIHR</term>
          <def>
            <p>National Institute for Health Research</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ONS</term>
          <def>
            <p>online news source</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">RSS</term>
          <def>
            <p>relative sentiment skew</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">VEEPED</term>
          <def>
            <p>Vaccine Efficacy Evaluation for Priority Emerging Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>DL and SB acknowledge joint center funding from the UK Medical Research Council and Department for International Development (grant MR/R015600/1). DL acknowledges funding from the Vaccine Efficacy Evaluation for Priority Emerging Diseases (VEEPED) grant (ref. NIHR:PR-OD-1017-20002) from the National Institute for Health Research (NIHR). SB acknowledges funding from The Novo Nordisk Young Investigator Award (NNF20OC0059309), The Danish National Research Foundation via a chair position, and the NIHR Health Protection Research Unit in Modelling Methodology.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neagu</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The bumpy road to achieve herd immunity in COVID-19</article-title>
          <source>J Immunoassay Immunochem</source>
          <year>2020</year>
          <month>11</month>
          <day>01</day>
          <volume>41</volume>
          <issue>6</issue>
          <fpage>928</fpage>
          <lpage>945</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://paperpile.com/b/Ukzupd/8q4X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/15321819.2020.1833919</pub-id>
          <pub-id pub-id-type="medline">33086932</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Voysey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clemens</surname>
              <given-names>SAC</given-names>
            </name>
            <name name-style="western">
              <surname>Madhi</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Weckx</surname>
              <given-names>LY</given-names>
            </name>
            <name name-style="western">
              <surname>Folegatti</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Aley</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Angus</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Baillie</surname>
              <given-names>VL</given-names>
            </name>
            <name name-style="western">
              <surname>Barnabas</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Bhorat</surname>
              <given-names>QE</given-names>
            </name>
            <name name-style="western">
              <surname>Bibi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Briner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cicconi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Colin-Jones</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cutland</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Darton</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Dheda</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Duncan</surname>
              <given-names>CJA</given-names>
            </name>
            <name name-style="western">
              <surname>Emary</surname>
              <given-names>KRW</given-names>
            </name>
            <name name-style="western">
              <surname>Ewer</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fairlie</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Faust</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Finn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Heath</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hirsch</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hodgson</surname>
              <given-names>SHC</given-names>
            </name>
            <name name-style="western">
              <surname>Izu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Joe</surname>
              <given-names>CCD</given-names>
            </name>
            <name name-style="western">
              <surname>Kerridge</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Koen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kwatra</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lazarus</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrie</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Lelliott</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Libri</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mallory</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mendes</surname>
              <given-names>AVA</given-names>
            </name>
            <name name-style="western">
              <surname>Milan</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Minassian</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>McGregor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Morrison</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mujadidi</surname>
              <given-names>YF</given-names>
            </name>
            <name name-style="western">
              <surname>Nana</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Reilly</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Padayachee</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Pittella</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Plested</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pollock</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Ramasamy</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Rhead</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schwarzbold</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Snape</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Sprinz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sutherland</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Tarrant</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Thomson</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Török</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Toshner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>DPJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vekemans</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Villafana</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>MEE</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Douglas</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>AVS</given-names>
            </name>
            <name name-style="western">
              <surname>Lambe</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>AJ</given-names>
            </name>
            <collab>Oxford COVID Vaccine Trial Group</collab>
          </person-group>
          <article-title>Safety and efficacy of the ChAdOx1 nCoV-19 vaccine (AZD1222) against SARS-CoV-2: an interim analysis of four randomised controlled trials in Brazil, South Africa, and the UK</article-title>
          <source>Lancet</source>
          <year>2021</year>
          <month>01</month>
          <day>09</day>
          <volume>397</volume>
          <issue>10269</issue>
          <fpage>99</fpage>
          <lpage>111</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0140-6736(20)32661-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)32661-1</pub-id>
          <pub-id pub-id-type="medline">33306989</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)32661-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7723445</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Polack</surname>
              <given-names>FP</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kitchin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Absalon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gurtman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lockhart</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez Marc</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Moreira</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Zerbini</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Swanson</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Roychoudhury</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Koury</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kalina</surname>
              <given-names>WV</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Frenck</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Hammitt</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Türeci</surname>
              <given-names>Ö</given-names>
            </name>
            <name name-style="western">
              <surname>Nell</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Schaefer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ünal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tresnan</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Mather</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dormitzer</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Şahin</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>KU</given-names>
            </name>
            <name name-style="western">
              <surname>Gruber</surname>
              <given-names>WC</given-names>
            </name>
            <collab>C4591001 Clinical Trial Group</collab>
          </person-group>
          <article-title>Safety and efficacy of the BNT162b2 mRNA Covid-19 vaccine</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>12</month>
          <day>31</day>
          <volume>383</volume>
          <issue>27</issue>
          <fpage>2603</fpage>
          <lpage>2615</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33301246"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa2034577</pub-id>
          <pub-id pub-id-type="medline">33301246</pub-id>
          <pub-id pub-id-type="pmcid">PMC7745181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baden</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>El Sahly</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Essink</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kotloff</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Frey</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Novak</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diemert</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Spector</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Rouphael</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Creech</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>McGettigan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khetan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Segall</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Solis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brosz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fierro</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Neuzil</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corey</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Janes</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Follmann</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Marovich</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mascola</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Polakowski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ledgerwood</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Graham</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pajon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Knightly</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Leav</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ivarsson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zaks</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Efficacy and safety of the mRNA-1273 SARS-CoV-2 vaccine</article-title>
          <source>N Engl J Med</source>
          <year>2021</year>
          <month>02</month>
          <day>04</day>
          <volume>384</volume>
          <issue>5</issue>
          <fpage>403</fpage>
          <lpage>416</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmoa2035389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dubé</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Laberge</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Guay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bramadat</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bettinger</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Vaccine hesitancy: an overview</article-title>
          <source>Hum Vaccin Immunother</source>
          <year>2013</year>
          <month>08</month>
          <day>27</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>1763</fpage>
          <lpage>73</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23584253"/>
          </comment>
          <pub-id pub-id-type="doi">10.4161/hv.24657</pub-id>
          <pub-id pub-id-type="medline">23584253</pub-id>
          <pub-id pub-id-type="pii">24657</pub-id>
          <pub-id pub-id-type="pmcid">PMC3906279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fridman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gershon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gneezy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 and vaccine hesitancy: A longitudinal study</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <month>4</month>
          <day>16</day>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>e0250123</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0250123"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0250123</pub-id>
          <pub-id pub-id-type="medline">33861765</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-35660</pub-id>
          <pub-id pub-id-type="pmcid">PMC8051771</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yousefinaghani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mubareka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Papadopoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sharif</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An analysis of COVID-19 vaccine sentiments and opinions on Twitter</article-title>
          <source>Int J Infect Dis</source>
          <year>2021</year>
          <month>07</month>
          <volume>108</volume>
          <fpage>256</fpage>
          <lpage>262</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1201-9712(21)00462-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijid.2021.05.059</pub-id>
          <pub-id pub-id-type="medline">34052407</pub-id>
          <pub-id pub-id-type="pii">S1201-9712(21)00462-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8157498</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jemielniak</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Krempovych</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>An analysis of AstraZeneca COVID-19 vaccine misinformation and fear mongering on Twitter</article-title>
          <source>Public Health</source>
          <year>2021</year>
          <month>11</month>
          <volume>200</volume>
          <fpage>4</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34628307"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.puhe.2021.08.019</pub-id>
          <pub-id pub-id-type="medline">34628307</pub-id>
          <pub-id pub-id-type="pii">S0033-3506(21)00346-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8494632</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raciborski</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jankowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gujski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pinkas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Samel-Kowalik</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Changes in attitudes towards the COVID-19 vaccine and the willingness to get vaccinated among adults in Poland: analysis of serial, cross-sectional, representative surveys, January-April 2021</article-title>
          <source>Vaccines (Basel)</source>
          <year>2021</year>
          <month>07</month>
          <day>29</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>A</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=vaccines9080832"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/vaccines9080832</pub-id>
          <pub-id pub-id-type="medline">34451957</pub-id>
          <pub-id pub-id-type="pii">vaccines9080832</pub-id>
          <pub-id pub-id-type="pmcid">PMC8402425</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Both rates of fake news and fact-based news on Twitter negatively correlate with the state-level COVID-19 vaccine uptake</article-title>
          <source>arXiv. Preprint posted online February 17, 2022</source>
          <year>2020</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2106.07435"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Germani</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Biller-Andorno</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>The anti-vaccination infodemic on social media: A behavioral analysis</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>e0247642</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0247642"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0247642</pub-id>
          <pub-id pub-id-type="medline">33657152</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-39758</pub-id>
          <pub-id pub-id-type="pmcid">PMC7928468</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Righetti</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>The impact of the politicization of health on online misinformation and quality information on vaccines</article-title>
          <source>Italian Sociological Review</source>
          <year>2021</year>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.italiansociologicalreview.com/ojs/index.php?journal=ISR&amp;page=article&amp;op=view&amp;path%5B%5D=448"/>
          </comment>
          <pub-id pub-id-type="doi">10.13136/isr.v11i2.448</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Motta</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Republicans, not Democrats, are more likely to endorse anti-vaccine misinformation</article-title>
          <source>American Politics Research</source>
          <year>2021</year>
          <month>06</month>
          <day>14</day>
          <volume>49</volume>
          <issue>5</issue>
          <fpage>428</fpage>
          <lpage>438</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/1532673X211022639"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1532673x211022639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baines</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ittefaq</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abwao</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>#Scamdemic, #Plandemic, or #Scaredemic: what Parler social media platform tells us about COVID-19 vaccine</article-title>
          <source>Vaccines (Basel)</source>
          <year>2021</year>
          <month>04</month>
          <day>22</day>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>421</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=vaccines9050421"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/vaccines9050421</pub-id>
          <pub-id pub-id-type="medline">33922343</pub-id>
          <pub-id pub-id-type="pii">vaccines9050421</pub-id>
          <pub-id pub-id-type="pmcid">PMC8146829</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kalimeri</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Beiró</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Urbinati</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bonanomi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rosina</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Human values and attitudes towards vaccination in social media</article-title>
          <year>2019</year>
          <conf-name>WWW '19: The Web Conference</conf-name>
          <conf-date>May 13-17, 2019</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3308560.3316489</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jenkins</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Vaccination discussion among parents on social media: a content analysis of comments on parenting blogs</article-title>
          <source>J Health Commun</source>
          <year>2020</year>
          <month>03</month>
          <day>03</day>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>232</fpage>
          <lpage>242</lpage>
          <pub-id pub-id-type="doi">10.1080/10810730.2020.1737761</pub-id>
          <pub-id pub-id-type="medline">32154770</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chadwick</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vaccari</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lambe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Loe</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderslott</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lewandowsky</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Conroy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>ARN</given-names>
            </name>
            <name name-style="western">
              <surname>Innocenti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Waite</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Larkin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rosebrock</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jenner</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McShane</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Giubilini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Petit</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Online social endorsement and Covid-19 vaccine hesitancy in the United Kingdom</article-title>
          <source>Social Media + Society</source>
          <year>2021</year>
          <month>04</month>
          <day>05</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>205630512110088</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/20563051211008817"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20563051211008817</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lancaster</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rhodes</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>“A matter of time”: Evidence-making temporalities of vaccine development in the COVID-19 media landscape</article-title>
          <source>Time &amp; Society</source>
          <year>2021</year>
          <month>07</month>
          <day>15</day>
          <volume>31</volume>
          <issue>1</issue>
          <fpage>132</fpage>
          <lpage>154</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/0961463X211032201"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0961463x211032201</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Motta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stecula</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The influence of partisan media in the face of global pandemic: how news media influenced COVID-19 vaccine hesitancy</article-title>
          <source>SocArXiv. Preprint posted online September 16, 2021</source>
          <year>2021</year>
          <pub-id pub-id-type="doi">10.31235/osf.io/xj4nq</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gbashi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Adebo</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Doorsamy</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Njobeh</surname>
              <given-names>PB</given-names>
            </name>
          </person-group>
          <article-title>Systematic delineation of media polarity on COVID-19 vaccines in Africa: computational linguistic modeling study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>03</month>
          <day>16</day>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>e22916</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/3/e22916/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22916</pub-id>
          <pub-id pub-id-type="medline">33667172</pub-id>
          <pub-id pub-id-type="pii">v9i3e22916</pub-id>
          <pub-id pub-id-type="pmcid">PMC7968413</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stecula</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pickup</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>How populism and conservative media fuel conspiracy beliefs about COVID-19 and what it means for COVID-19 behaviors</article-title>
          <source>Research &amp; Politics</source>
          <year>2021</year>
          <month>02</month>
          <day>15</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>205316802199397</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/2053168021993979"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2053168021993979</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Melo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Figueiredo</surname>
              <given-names>CMS</given-names>
            </name>
          </person-group>
          <article-title>Comparing news articles and tweets about COVID-19 in Brazil: sentiment analysis and topic modeling approach</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>02</month>
          <day>10</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e24585</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/2/e24585/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24585</pub-id>
          <pub-id pub-id-type="medline">33480853</pub-id>
          <pub-id pub-id-type="pii">v7i2e24585</pub-id>
          <pub-id pub-id-type="pmcid">PMC7886485</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chelkowski</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Laydon</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xifara</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gibert</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mellan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schwämmle</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Röttger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hadsund</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatt</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Quantifying online news media coverage of the COVID-19 pandemic: text mining study and resource</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>06</month>
          <day>02</day>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>e28253</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/6/e28253/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/28253</pub-id>
          <pub-id pub-id-type="medline">33900934</pub-id>
          <pub-id pub-id-type="pii">v23i6e28253</pub-id>
          <pub-id pub-id-type="pmcid">PMC8174556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Steven Bird, Ewan Klein and Edward Loper: natural language processing with Python, analyzing text with the Natural Language Toolkit</article-title>
          <source>Lang Resources &amp; Evaluation</source>
          <year>2010</year>
          <month>5</month>
          <day>27</day>
          <volume>44</volume>
          <issue>4</issue>
          <fpage>421</fpage>
          <lpage>424</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1007/s10579-010-9124-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10579-010-9124-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Amri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zenkouar</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Ezziyyani</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Amazigh POS Tagging Using TreeTagger: A Language Independant Model</article-title>
          <source>Advanced Intelligent Systems for Sustainable Development (AI2SD’2018). AI2SD 2018. Advances in Intelligent Systems and Computing, vol 915</source>
          <year>2019</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer International Publishing</publisher-name>
          <fpage>622</fpage>
          <lpage>632</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grootendorst</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Bertopic: Leveraging bert and c-tf-idf to create easily interpretable topics</article-title>
          <source>Version v0.7</source>
          <year>2021</year>
          <month>04</month>
          <day>01</day>
          <fpage>4</fpage>
          <pub-id pub-id-type="doi">10.1007/springerreference_179544</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ebeling</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Córdova Sáenz</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Nobre</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Becker</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The effect of political polarization on social distance stances in the Brazilian COVID-19 scenario</article-title>
          <source>JIDM</source>
          <year>2021</year>
          <month>08</month>
          <day>05</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://sol.sbc.org.br/journals/index.php/jidm/article/download/1889/1776"/>
          </comment>
          <pub-id pub-id-type="doi">10.5753/jidm.2021.1889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Valensise</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cinelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nadini</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Galeazzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peruzzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Etta</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zollo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Baronchelli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Quattrociocchi</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Lack of evidence for correlation between COVID-19 infodemic and vaccine acceptance</article-title>
          <source>arXiv. Preprint posted online September 14, 2021</source>
          <year>2020</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2107.07946"/>
          </comment>
          <pub-id pub-id-type="doi">10.31219/osf.io/sxd5t</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Honnibal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Montani</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Van</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>spaCy: Industrial-strength natural language processing in python</article-title>
          <source>Zenodo</source>
          <access-date>2022-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://spacy.io/">https://spacy.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hutto</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>VADER: A Parsimonious Rule-based Model for Sentiment Analysis of Social Media Text</article-title>
          <source>ERIC GILBERT</source>
          <year>2014</year>
          <access-date>2022-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://eegilbert.org/papers/icwsm14.vader.hutto.pdf">http://eegilbert.org/papers/icwsm14.vader.hutto.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Filter bubbles, echo chambers, and online news consumption</article-title>
          <source>PUBOPQ</source>
          <year>2016</year>
          <month>03</month>
          <day>22</day>
          <volume>80</volume>
          <issue>S1</issue>
          <fpage>298</fpage>
          <lpage>320</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/poq/article-abstract/80/S1/298/2223402"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/poq/nfw006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mullard</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>How COVID vaccines are being divvied up around the world</article-title>
          <source>Nature</source>
          <year>2020</year>
          <month>11</month>
          <day>30</day>
          <access-date>2022-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/d41586-020-03370-6">https://www.nature.com/articles/d41586-020-03370-6</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cioffi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cioffi</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccine: Risk of inequality and failure of public health strategies</article-title>
          <source>Ethics Med Public Health</source>
          <year>2021</year>
          <month>06</month>
          <volume>17</volume>
          <fpage>100653</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33758775"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jemep.2021.100653</pub-id>
          <pub-id pub-id-type="medline">33758775</pub-id>
          <pub-id pub-id-type="pii">S2352-5525(21)00030-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7972670</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
