<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id>
      <journal-title>JMIR Infodemiology</journal-title>
      <issn pub-type="epub">2564-1891</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v3i1e43700</article-id>
      <article-id pub-id-type="pmid">37903294</article-id>
      <article-id pub-id-type="doi">10.2196/43700</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Using COVID-19 Vaccine Attitudes Found in Tweets to Predict Vaccine Perceptions in Traditional Surveys: Infodemiology Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Cuomo</surname>
            <given-names>Raphael</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kreute</surname>
            <given-names>Frauke</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Steel</surname>
            <given-names>David</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mejova</surname>
            <given-names>Yelena</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mondal</surname>
            <given-names>Himel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Sigalo</surname>
            <given-names>Nekabari</given-names>
          </name>
          <degrees>BSc, MPH, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>College of Information Studies</institution>
            <institution>University of Maryland</institution>
            <addr-line>4130 Campus Dr</addr-line>
            <addr-line>College Park, MD, 20742</addr-line>
            <country>United States</country>
            <phone>1 301 405 2033</phone>
            <email>nsigalo@terpmail.umd.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2749-4701</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Frias-Martinez</surname>
            <given-names>Vanessa</given-names>
          </name>
          <degrees>BSc, MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5114-7633</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>College of Information Studies</institution>
        <institution>University of Maryland</institution>
        <addr-line>College Park, MD</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Nekabari Sigalo <email>nsigalo@terpmail.umd.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>11</month>
        <year>2023</year>
      </pub-date>
      <volume>3</volume>
      <elocation-id>e43700</elocation-id>
      <history>
        <date date-type="received">
          <day>20</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>16</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>10</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Nekabari Sigalo, Vanessa Frias-Martinez. Originally published in JMIR Infodemiology (https://infodemiology.jmir.org), 30.11.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on https://infodemiology.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://infodemiology.jmir.org/2023/1/e43700" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Traditionally, surveys are conducted to answer questions related to public health but can be costly to execute. However, the information that researchers aim to extract from surveys could potentially be retrieved from social media, which possesses data that are highly accessible and lower in cost to collect.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to evaluate whether attitudes toward COVID-19 vaccines collected from the Household Pulse Survey (HPS) could be predicted using attitudes extracted from Twitter (subsequently rebranded X). Ultimately, this study aimed to determine whether Twitter can provide us with similar information to that observed in traditional surveys or whether saving money comes at the cost of losing rich data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>COVID-19 vaccine attitudes were extracted from the HPS conducted between January 6 and May 25, 2021. Twitter’s streaming application programming interface was used to collect COVID-19 vaccine tweets during the same period. A sentiment and emotion analysis of tweets was conducted to examine attitudes toward the COVID-19 vaccine on Twitter. Generalized linear models and generalized linear mixed models were used to evaluate the ability of COVID-19 vaccine attitudes on Twitter to predict vaccine attitudes in the HPS.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The results revealed that vaccine perceptions expressed on Twitter performed well in predicting vaccine perceptions in the survey.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>These findings suggest that the information researchers aim to extract from surveys could potentially also be retrieved from a more accessible data source, such as Twitter. Leveraging Twitter data alongside traditional surveys can provide a more comprehensive and nuanced understanding of COVID-19 vaccine perceptions, facilitating evidence-based decision-making and tailored public health strategies.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social media</kwd>
        <kwd>Twitter</kwd>
        <kwd>COVID-19</kwd>
        <kwd>vaccine</kwd>
        <kwd>surveys</kwd>
        <kwd>SARS-CoV-2</kwd>
        <kwd>vaccinations</kwd>
        <kwd>hesitancy</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The implementation of successful COVID-19 vaccine rollouts is essential for COVID-19 to remain under control globally. Although vaccines are essential in the global battle against COVID-19, vaccine hesitancy continues to be a barrier to effective and consistent vaccine rollout programs. According to the US Census Bureau’s Household Pulse Survey (HPS), individuals who reported being hesitant about receiving a COVID-19 vaccine cited concerns about side effects, safety, and a lack of trust in the vaccine or the government [<xref ref-type="bibr" rid="ref1">1</xref>]. Although the number of vaccine-hesitant individuals continues to decline, the fact that vaccine hesitancy still exists interferes with infection control through vaccination.</p>
        <p>Vaccine hesitancy has been fueled in part by the spread of vaccine misinformation, both in the media and on the web. In fact, the COVID-19 vaccine became a popular topic of discussion among social media users, with many individuals expressing their concerns about taking the vaccine on social media platforms [<xref ref-type="bibr" rid="ref2">2</xref>]. Amid the new normal of self-quarantine and lockdown, Twitter (subsequently rebranded X) quickly emerged as an important means of COVID-19 communications and discussion [<xref ref-type="bibr" rid="ref3">3</xref>]. This is in part due to the real-time availability of social media messaging, compared with traditional news reporting methods [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Twitter users often not only take to the platform to announce their own experiences and opinions about the pandemic but also see Twitter as a source of up-to-date information about the pandemic [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>The COVID-19 vaccine conversation on social media platforms has been both beneficial and detrimental to vaccination efforts across the world [<xref ref-type="bibr" rid="ref7">7</xref>]. Although the exact effect of social media on this unprecedented pandemic is difficult to quantify, there has been a constant battle between facts and misinformation, trust and fearmongering, and hope and anger [<xref ref-type="bibr" rid="ref8">8</xref>]. Research has shown that social media use plays a role in the low acceptance of vaccines [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Therefore, studying the public COVID-19 vaccine–related discussion on social media can help researchers better understand attitudes related to the vaccine [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>Traditionally, surveys are conducted to understand attitudes related to public health. For example, many studies leveraged surveys to examine COVID-19 vaccine hesitancy and compliance. In April 2020, Ward et al [<xref ref-type="bibr" rid="ref11">11</xref>] administered 4 web-based, nationally representative surveys to adults in France to identify the reasons why individuals would or would not take the COVID-19 vaccine once it became available. Researchers found that nearly a quarter of the respondents refused to take the COVID-19 vaccine once it was made available to them, citing reasons such as not trusting vaccines in general; concerns about the expedited vaccine development process; and a lack of fear of COVID-19, deeming the vaccine unnecessary.</p>
        <p>In the study by Wang et al [<xref ref-type="bibr" rid="ref12">12</xref>], a cross-sectional, self-administered survey was conducted to evaluate the COVID-19 vaccine intent among nurses in Hong Kong, China. Researchers found higher rates of vaccine hesitancy compared with vaccine acceptance, with nurses citing concerns about the safety and efficacy of the vaccines. A web-based survey conducted in the study by Ruiz and Bell [<xref ref-type="bibr" rid="ref13">13</xref>] attempted to identify the predictors of the intent to vaccinate against COVID-19 among Americans. Nearly 40% of the survey respondents refused to be vaccinated against COVID-19. Among the survey respondents, male, older, White, and married individuals and individuals with higher socioeconomic status were more likely to be vaccinated against COVID-19. Researchers also found that Republicans and Fox News viewers were less likely to get vaccinated, whereas individuals who were previously vaccinated for influenza were more likely to be vaccinated for COVID-19.</p>
        <p>Although several studies have examined COVID-19 vaccine attitudes through surveys, to our knowledge, no study has evaluated the ability of Twitter, a newer data source, to predict the attitudes reflected in traditionally collected surveys, such as the HPS. In recent years, researchers have looked at social media as a data source, citing the availability of more readily available data and no- or low-cost data collection efforts [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Traditional mail, field, and telephone interviewer surveys come with high costs of administration, and even though web-based surveys eliminate the costs of postage, paper, printing, and data entry, the newer web-based survey services may still cost up to thousands of dollars for 1 survey [<xref ref-type="bibr" rid="ref16">16</xref>]. Although relatively inexpensive compared with traditional surveys, web-based surveys are not always cost-effective [<xref ref-type="bibr" rid="ref16">16</xref>]. Evaluating the ability of information extracted from social media to predict information found in traditional surveys would suggest whether researchers may use this more cost-effective data source to provide similar rich information to that seen in traditional surveys or whether saving money comes at the cost of losing rich data.</p>
      </sec>
      <sec>
        <title>Study Overview</title>
        <p>The main objective of this study was to examine whether aggregate attitudes extracted from social media can predict vaccine attitudes collected via surveys. We hypothesized that social media may contain attitudes similar to those found in traditional surveys, with the added benefits of more readily available data and no- or low-cost data collection efforts. Predictive models of vaccine attitudes at the metropolitan level can be useful for 2 purposes. First, predictions can be used to identify metropolitan areas where vaccine hesitancy is high and create targeted campaigns to increase vaccination. Second, the relationships between sentiments and emotions and vaccine attitudes can be used to understand human perceptions of vaccines and create effective social media messages for vaccination campaigns. Specifically, we hypothesize that there is a direct, positive relationship between (1) positive sentiments and emotions found in Twitter data and the HPS and (2) negative sentiments and emotions found in Twitter data and the HPS survey.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection and Preprocessing</title>
        <sec>
          <title>HPS Data</title>
          <p>In April 2020, the US Census Bureau began releasing a cross-sectional nationally representative survey, the HPS, in an effort to assess the social and economic impacts of the COVID-19 pandemic on American households [<xref ref-type="bibr" rid="ref17">17</xref>]. The data from this survey were made publicly available in near real time with the purpose of informing federal and state response and recovery planning [<xref ref-type="bibr" rid="ref18">18</xref>]. The HPS sample was selected using a stratified random sampling method [<xref ref-type="bibr" rid="ref19">19</xref>]. Data were collected via computer-assisted telephone interviewing, a data collection method in which surveyors use computer software to conduct telephone interviews with respondents [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
          <p>On January 6, 2021, the US Census Bureau added COVID-19 vaccine–related questions to the HPS with the goal of understanding the factors contributing to vaccine hesitancy and compliance among Americans [<xref ref-type="bibr" rid="ref20">20</xref>] (<xref ref-type="table" rid="table1">Table 1</xref>). These questions assessed COVID-19 vaccine receipt, whether respondents received or planned to receive all required doses, intentions to get vaccinated, and reasons why respondents refused to get vaccinated.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>COVID-19–related Household Pulse Survey questions.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="340"/>
              <col width="370"/>
              <col width="290"/>
              <thead>
                <tr valign="top">
                  <td>Condition</td>
                  <td>Question</td>
                  <td>Responses</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Age &#62;18 years</td>
                  <td>Have you received a COVID-19 vaccine?</td>
                  <td>(1) Yes<break/>(2) No</td>
                </tr>
                <tr valign="top">
                  <td>Answered “yes” to “have you received a COVID-19 vaccine?”</td>
                  <td>Did you receive (or do you plan to receive) all required doses?</td>
                  <td>(1) Yes<break/>(2) No</td>
                </tr>
                <tr valign="top">
                  <td>Answered “no” to “have you received a COVID-19 vaccine?”</td>
                  <td>Once a vaccine to prevent COVID-19 is available to you, would you...</td>
                  <td>(1) Definitely get a vaccine<break/>(2) Probably get a vaccine<break/>(3) Be unsure about getting a vaccine<break/>(4) Probably not get a vaccine<break/>(5) Definitely not get a vaccine</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <p>Measures of vaccine compliance and hesitancy were assessed for each survey wave overall and in the metropolitan areas in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>. At the start of the survey period, January 2021, vaccine rollout in the United States had just begun, and with most people unvaccinated at that point, the intent to vaccinate was the only option. For the purposes of this analysis, individuals who answered that they would “definitely get a vaccine” or “probably get a vaccine” once available were considered <italic>vaccine compliant</italic>, and individuals who answered that they would “probably not get a vaccine,” or “definitely not get a vaccine” once available were considered <italic>vaccine hesitant</italic>.</p>
          <p>The HPS refers to the data collection cycles as <italic>weeks</italic> for consistency with earlier phases, even though the cycles actually span a 2-week collection period. For this study, we used the HPS microdata from weeks 22 to 30, which were collected between January 6 and May 25, 2021, with response rates ranging from 6.4% to 7.5% (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
          <boxed-text id="box1" position="float">
            <title>Targeted metropolitan areas for data collection (January to May 2021).</title>
            <list list-type="bullet">
              <list-item>
                <p>New York–Newark–Jersey City, New York–New Jersey–Pennsylvania metropolitan area</p>
              </list-item>
              <list-item>
                <p>Los Angeles–Long Beach–Anaheim, California metropolitan area</p>
              </list-item>
              <list-item>
                <p>Chicago-Naperville-Elgin, Illinois-Indiana-Wisconsin metropolitan area</p>
              </list-item>
              <list-item>
                <p>Dallas–Fort Worth–Arlington, Texas metropolitan area</p>
              </list-item>
              <list-item>
                <p>Houston–The Woodlands–Sugar Land, Texas metropolitan area</p>
              </list-item>
              <list-item>
                <p>Washington-Arlington-Alexandria, District of Columbia–Virginia–Maryland–West Virginia metropolitan area</p>
              </list-item>
              <list-item>
                <p>Miami–Fort Lauderdale–Pompano Beach, FL metropolitan area</p>
              </list-item>
              <list-item>
                <p>Philadelphia-Camden-Wilmington, Pennsylvania–New Jersey–Delaware–Maryland metropolitan area</p>
              </list-item>
              <list-item>
                <p>Atlanta–Sandy Springs–Alpharetta, Georgia metropolitan area</p>
              </list-item>
              <list-item>
                <p>Phoenix-Mesa-Chandler, Arizona metropolitan area</p>
              </list-item>
              <list-item>
                <p>Boston-Cambridge-Newton, Massachusetts–New Hampshire metropolitan area</p>
              </list-item>
              <list-item>
                <p>San Francisco–Oakland–Berkeley, California metropolitan area</p>
              </list-item>
              <list-item>
                <p>Detroit-Warren-Dearborn, Michigan metropolitan area</p>
              </list-item>
              <list-item>
                <p>Seattle-Tacoma-Bellevue, Washington metropolitan area</p>
              </list-item>
            </list>
          </boxed-text>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Household Pulse Survey data collection schedule.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="530"/>
              <col width="190"/>
              <col width="280"/>
              <thead>
                <tr valign="top">
                  <td>Collection dates</td>
                  <td>Week</td>
                  <td>Response rate (%)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>January 6-January 18, 2021</td>
                  <td>22</td>
                  <td>6.4</td>
                </tr>
                <tr valign="top">
                  <td>January 20-February 1, 2021</td>
                  <td>23</td>
                  <td>7.5</td>
                </tr>
                <tr valign="top">
                  <td>February 3-February 15, 2021</td>
                  <td>24</td>
                  <td>7.3</td>
                </tr>
                <tr valign="top">
                  <td>February 17-March 1, 2021</td>
                  <td>25</td>
                  <td>7.3</td>
                </tr>
                <tr valign="top">
                  <td>March 3-March 15, 2021</td>
                  <td>26</td>
                  <td>7.4</td>
                </tr>
                <tr valign="top">
                  <td>March 17-March 29, 2021</td>
                  <td>27</td>
                  <td>7.2</td>
                </tr>
                <tr valign="top">
                  <td>April 14-April 26, 2021</td>
                  <td>28</td>
                  <td>6.6</td>
                </tr>
                <tr valign="top">
                  <td>April 28-May 10, 2021</td>
                  <td>29</td>
                  <td>7.4</td>
                </tr>
                <tr valign="top">
                  <td>May 12-May 24, 2021</td>
                  <td>30</td>
                  <td>6.8</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
        <sec>
          <title>Twitter Data</title>
          <p>To align with the HPS data collection period outlined in <xref ref-type="table" rid="table2">Table 2</xref>, the Twitter Streaming application programming interface, which provides access to a random sample of 1% of publicly available tweets, was used to collect tweets from the metropolitan areas represented in the HPS (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>) from January to May 2021. All tweets had <italic>place</italic> information (usually city and state). The place information found in tweets was used to determine the metropolitan area associated with each tweet. Next, to extract tweets related to COVID-19 vaccines, tweets were further filtered by matching variations of vaccine-related keywords, such as <italic>vaccine, pfizer, moderna, johnson &#38; johnson,</italic> and <italic>dose</italic>. The tweet sample was further preprocessed to minimize <italic>noise</italic> resulting from tweets that matched our vaccine-related keywords but did not necessarily reflect the thoughts and opinions of individual Twitter users. For example, companies often promote job postings and advertisements on Twitter using targeted hashtags in hopes of reaching their target audience. To prevent these tweets from adding noise to the sample, tweets related to job postings and advertisements were removed by excluding tweets with hashtags and keywords such as <italic>#jobs</italic>, <italic>#hiring</italic>, and <italic>#ad</italic>.</p>
        </sec>
        <sec>
          <title>Sentiment and Emotion Analysis of Tweets</title>
          <p>To capture the attitudes found in COVID-19 vaccine–related tweets, a sentiment and emotion analysis of all tweets was conducted using the Natural Language Understanding Research Consortium (NRC) lexicon from the <italic>Syuzhet</italic> package in R (R Core Team) [<xref ref-type="bibr" rid="ref21">21</xref>]. The NRC lexicon, developed by Saif Mohammad, contains a list of manually labeled English words and their associations with negative and positive sentiments and common human emotions, such as trust, fear, sadness, surprise, and disgust [<xref ref-type="bibr" rid="ref22">22</xref>]. The <italic>Syuzhet</italic> package applies the NRC lexicon by independently evaluating and rating each word or expression within a tweet [<xref ref-type="bibr" rid="ref23">23</xref>]. The <italic>get_nrc_sentiment</italic> function was applied to all tweets to calculate the valence of 8 different emotions (fear, joy, anticipation, anger, disgust, sadness, surprise, and trust), along with the overall positive and negative sentiments, toward the COVID-19 vaccine. To assess the accuracy of the sentiment classifier, a random sample of 1000 tweets was selected for manual classification as having a positive or negative sentiment. Among the 1000 tweets in the random sample, 734 (73.4%) were accurately classified by the automated sentiment classifier.</p>
          <p>The percentage of tweets expressing the 8 emotions, along with the percentage of tweets expressing a positive or negative sentiment, was calculated at the metropolitan level. For the purposes of this analysis, we used the proportion of tweets with a positive sentiment and positive emotions toward vaccines as a proxy to capture vaccine compliance among Twitter users, and the proportion of tweets with a negative sentiment and negative emotions toward vaccines was used as a proxy to capture vaccine hesitancy among Twitter users.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>Statistical analysis was conducted using the R software packages <italic>betareg</italic> and <italic>GLMMadaptive</italic> [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. To determine whether COVID-19 vaccine attitudes on Twitter can predict the proportion of COVID-19 vaccine perceptions ultimately expressed in the HPS (unweighted), both generalized linear models (GLMs) and generalized linear mixed models (GLMMs) were constructed (<xref ref-type="table" rid="table3">Table 3</xref>). The models were developed using a total of 126 data points, including proportional vaccine compliance and hesitancy proxies from 14 metropolitan areas across 9 survey waves.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Regression models evaluating the relationship between Twitter sentiments and emotions and HPS<sup>a</sup> vaccine hesitancy and compliance.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="180"/>
            <col width="500"/>
            <col width="320"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td>Features</td>
                <td>Outcome</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Model 1a (GLM<sup>b</sup>)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Percentage of positive sentiment</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of joy</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of surprise</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of trust</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of anticipation</p>
                    </list-item>
                  </list>
                  <list list-type="bullet">
                    <list-item>
                      <p>Percentage of survey week (fixed effect)</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of metropolitan area (fixed effect)</p>
                    </list-item>
                  </list>
                </td>
                <td>Percentage of vaccine-compliant HPS respondents</td>
              </tr>
              <tr valign="top">
                <td>Model 1b (GLMM<sup>c</sup>)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Percentage of positive sentiment</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of joy</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of surprise</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of trust</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of anticipation</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of percentage of survey week (fixed effect)</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of metropolitan area (random effect)</p>
                    </list-item>
                  </list>
                </td>
                <td>Percentage of vaccine-compliant HPS respondents</td>
              </tr>
              <tr valign="top">
                <td>Model 2a (GLM)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Percentage of negative sentiment</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of anger</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of disgust</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of sadness</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of fear</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of anticipation</p>
                    </list-item>
                    <list-item>
                      <p>Survey week (fixed effect)</p>
                    </list-item>
                    <list-item>
                      <p>Metropolitan area (fixed effect)</p>
                    </list-item>
                  </list>
                </td>
                <td>Percentage of vaccine-hesitant HPS respondents</td>
              </tr>
              <tr valign="top">
                <td>Model 2b (GLMM)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Percentage of negative sentiment</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of anger</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of disgust</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of sadness</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of fear</p>
                    </list-item>
                    <list-item>
                      <p>Percentage of anticipation</p>
                    </list-item>
                  </list>
                  <list list-type="bullet">
                    <list-item>
                      <p>Survey week (fixed effect)</p>
                    </list-item>
                    <list-item>
                      <p>Metropolitan area (random effect)</p>
                    </list-item>
                  </list>
                </td>
                <td>Percentage of vaccine-hesitant HPS respondents</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>HPS: Household Pulse Survey.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>GLM: generalized linear model.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>GLMM: generalized linear mixed model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>GLMs were implemented with both time and geographic location as fixed effects, whereas the GLMMs were a multilevel approach with time as a fixed effect and metropolitan area as a random effect. The main reason behind this dual modeling choice is that random effects can capture the latent variation in the data that cannot be explained by fixed effects or the error term [<xref ref-type="bibr" rid="ref26">26</xref>]. Random effects represent factors with multiple levels, such as geographic location, and possess distinct components that vary across these levels. Random effects prove especially valuable when dealing with hierarchical or nested data structures, where observations are not independent but grouped at a higher level, and enable us to account for similarities within these groups and prevent overfitting [<xref ref-type="bibr" rid="ref25">25</xref>]. However, if there is limited variability across locations, including location as a random effect may lead to unstable estimates or unreliable inferences [<xref ref-type="bibr" rid="ref27">27</xref>]. In such cases, it is often better to treat location as a fixed effect or aggregate the data at a higher level. Thus, we constructed both GLMs and GLMMs to assess the prediction power of using metropolitan areas as either fixed or random effects. We fit beta regression models with the logit link, which is the most appropriate for modeling proportional data [<xref ref-type="bibr" rid="ref28">28</xref>]. In beta regression, the outcome variable is assumed to follow a beta distribution. Prior to evaluating the models, we conducted assumption checks and checked for multicollinearity and outliers to determine whether the necessary conditions were met. These model diagnostics are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>As shown in <xref ref-type="table" rid="table3">Table 3</xref>, we constructed 2 models to predict vaccine compliance (models 1a, GLM, and 1b, GLMM) and 2 models to predict vaccine hesitancy (models 2a, GLM, and 2b, GLMM). In model 1a, we fit a GLM in which the predictor variables were each of the 5 positive Twitter-derived sentiment and emotion features and the outcome variable was the proportion of vaccine-compliant HPS respondents. This model controlled for survey week (time) and metropolitan area as fixed effects. In model 1b, to account for variations in time and location, we fit a GLMM with each of the 5 positive Twitter-derived sentiment and emotion features and survey week (time) as fixed effects and metropolitan area as a random effect.</p>
        <p>By contrast, in model 2a, we fit a GLM in which the predictor variables were each of the 6 negative Twitter-derived sentiment and emotion features and the outcome variable was the proportion of vaccine-hesitant HPS respondents. This model controlled for survey week (time) and metropolitan area as fixed effects. In model 2b, we fit a GLMM with each of the 6 negative Twitter-derived sentiment and emotion features and survey week (time) as fixed effects and metropolitan area as a random effect. As anticipation can be perceived as both positive and negative, this emotion was included as a feature in all models.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This project does not meet the definition of human participant research under the purview of the University of Maryland Institutional Review Board according to federal regulations, section 45CFR46.102(e) [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Descriptive Statistics</title>
        <p>There were a total of 92,453 tweets from 32,645 users across the 14 metropolitan areas in this study (<xref ref-type="table" rid="table4">Table 4</xref>). The Los Angeles–Long Beach–Anaheim metropolitan area had the largest representation of tweets (21,500/92,453, 23.26%), whereas the New York–Newark–New Jersey metropolitan area had the largest representation of users (18,400/32,645, 56.36%). The maximum number of tweets by a single individual was 274 (from a user in the New York–Newark–New Jersey metropolitan area). There were a total of 240,242 respondents to the HPS across the 14 metropolitan areas and 9 waves in this study, with the largest sample being the sample from the Washington-Arlington-Alexandria metropolitan area (<xref ref-type="table" rid="table5">Table 5</xref>).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Number of tweets (N=92,453) and users (N=32,645) by metropolitan area (January to May 2021).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="130"/>
            <col width="120"/>
            <col width="230"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td>Metropolitan area, state</td>
                <td>Tweets, n (%)</td>
                <td>Users, n (%)</td>
                <td>Weekly number of tweets, mean (SD)</td>
                <td>Weekly number of users, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Atlanta–Sandy Springs–Alpharetta, Georgia</td>
                <td>4234 (4.58)</td>
                <td>1542 (4.72)</td>
                <td>470 (186)</td>
                <td>254 (106)</td>
              </tr>
              <tr valign="top">
                <td>Boston-Cambridge-Newton, Massachusetts–New Hampshire</td>
                <td>3019 (3.27)</td>
                <td>1298 (3.98)</td>
                <td>335 (133)</td>
                <td>218 (83)</td>
              </tr>
              <tr valign="top">
                <td>Chicago-Naperville-Elgin, Illinois-Indiana-Wisconsin</td>
                <td>5821 (6.3)</td>
                <td>2561 (7.84)</td>
                <td>647 (252)</td>
                <td>426 (160)</td>
              </tr>
              <tr valign="top">
                <td>Dallas–Fort Worth–Arlington, Texas</td>
                <td>6203 (6.71)</td>
                <td>2299 (7.04)</td>
                <td>689 (265)</td>
                <td>371 (133)</td>
              </tr>
              <tr valign="top">
                <td>Detroit-Warren-Dearborn-Michigan</td>
                <td>1082 (1.17)</td>
                <td>518 (1.59)</td>
                <td>120 (56)</td>
                <td>84 (40)</td>
              </tr>
              <tr valign="top">
                <td>Houston–The Woodlands–Sugar Land, Texas</td>
                <td>5125 (5.54)</td>
                <td>2421 (7.42)</td>
                <td>569 (234)</td>
                <td>388 (145)</td>
              </tr>
              <tr valign="top">
                <td>Los Angeles–Long Beach–Anaheim, California</td>
                <td>21,500 (23.26)</td>
                <td>5429 (16.63)</td>
                <td>2389 (983)</td>
                <td>891 (344)</td>
              </tr>
              <tr valign="top">
                <td>Miami–Fort Lauderdale–Pompano Beach, Florida</td>
                <td>1954 (2.11)</td>
                <td>849 (2.6)</td>
                <td>217 (74)</td>
                <td>131 (40)</td>
              </tr>
              <tr valign="top">
                <td>New York–Newark–Jersey City, New York–New Jersey–Pennsylvania</td>
                <td>18,400 (19.9)</td>
                <td>7259 (22.24)</td>
                <td>2044 (683)</td>
                <td>1272 (400)</td>
              </tr>
              <tr valign="top">
                <td>Philadelphia-Camden-Wilmington, Pennsylvania–New Jersey–Delaware-Maryland</td>
                <td>3652 (3.95)</td>
                <td>1406 (4.31)</td>
                <td>406 (156)</td>
                <td>250 (88)</td>
              </tr>
              <tr valign="top">
                <td>Phoenix-Mesa-Chandler, Arizona</td>
                <td>4778 (5.17)</td>
                <td>1573 (4.82)</td>
                <td>531 (183)</td>
                <td>260 (81)</td>
              </tr>
              <tr valign="top">
                <td>San Francisco–Oakland–Berkeley, California</td>
                <td>6376 (6.9)</td>
                <td>2008 (6.15)</td>
                <td>708 (261)</td>
                <td>347 (116)</td>
              </tr>
              <tr valign="top">
                <td>Seattle-Tacoma-Bellevue, Washington</td>
                <td>3089 (3.34)</td>
                <td>1333 (4.08)</td>
                <td>343 (157)</td>
                <td>227 (103)</td>
              </tr>
              <tr valign="top">
                <td>Washington-Arlington-Alexandria, District of Columbia–Virginia–Maryland–West Virginia</td>
                <td>7220 (7.81)</td>
                <td>2419 (7.41)</td>
                <td>802 (313)</td>
                <td>436 (155)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Number of survey respondents (N=240,242) by city.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="450"/>
            <col width="290"/>
            <col width="260"/>
            <thead>
              <tr valign="top">
                <td>Metropolitan area, state</td>
                <td>Respondents, n (%)</td>
                <td>Weekly number of respondents, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Atlanta–Sandy Springs–Alpharetta, Georgia</td>
                <td>12,611 (5.25)</td>
                <td>1261 (48)</td>
              </tr>
              <tr valign="top">
                <td>Boston-Cambridge-Newton, Massachusetts–New Hampshire</td>
                <td>20,078 (8.36)</td>
                <td>2008 (121)</td>
              </tr>
              <tr valign="top">
                <td>Chicago-Naperville-Elgin, Illinois-Indiana-Wisconsin</td>
                <td>16,044 (6.68)</td>
                <td>1604 (89)</td>
              </tr>
              <tr valign="top">
                <td>Dallas–Fort Worth–Arlington, Texas</td>
                <td>15,859 (6.6)</td>
                <td>1586 (88)</td>
              </tr>
              <tr valign="top">
                <td>Detroit-Warren-Dearborn-Michigan</td>
                <td>12,149 (5.06)</td>
                <td>1215 (88)</td>
              </tr>
              <tr valign="top">
                <td>Houston–The Woodlands–Sugar Land, Texas</td>
                <td>14,179 (5.9)</td>
                <td>1418 (125)</td>
              </tr>
              <tr valign="top">
                <td>Los Angeles–Long Beach–Anaheim, California</td>
                <td>17,006 (7.08)</td>
                <td>1701 (101)</td>
              </tr>
              <tr valign="top">
                <td>Miami–Fort Lauderdale–Pompano Beach, Florida</td>
                <td>11,641 (4.85)</td>
                <td>1164 (67)</td>
              </tr>
              <tr valign="top">
                <td>New York–Newark–Jersey City, New York–New Jersey–Pennsylvania</td>
                <td>19,730 (8.21)</td>
                <td>1973 (124)</td>
              </tr>
              <tr valign="top">
                <td>Philadelphia-Camden-Wilmington, Pennsylvania–New Jersey–Delaware–Maryland</td>
                <td>20,240 (8.42)</td>
                <td>2024 (162)</td>
              </tr>
              <tr valign="top">
                <td>Phoenix-Mesa-Chandler, Arizona</td>
                <td>14,027 (5.84)</td>
                <td>1403 (106)</td>
              </tr>
              <tr valign="top">
                <td>San Francisco–Oakland–Berkeley, California</td>
                <td>17,787 (7.4)</td>
                <td>1779 (78)</td>
              </tr>
              <tr valign="top">
                <td>Seattle-Tacoma-Bellevue, Washington</td>
                <td>18,615 (7.75)</td>
                <td>1862 (106)</td>
              </tr>
              <tr valign="top">
                <td>Washington-Arlington-Alexandria, District of Columbia–Virginia–Maryland–West Virginia</td>
                <td>30,276 (12.6)</td>
                <td>3028 (227)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Attitudes Toward COVID-19 Vaccines in Twitter Data</title>
        <p>A sentiment analysis classified most tweets (50,415/92,453, 54.53% of tweets overall) across all metropolitan areas as having a positive sentiment (<xref ref-type="table" rid="table6">Table 6</xref>). The Washington-Arlington-Alexandria metropolitan area had the largest proportion of tweets with a positive sentiment (53,715/92,453, 58.1%), whereas the Miami–Fort Lauderdale–Pompano Beach metropolitan area had the lowest proportion of tweets with a positive sentiment (47,059/92,453, 50.9%). Tweets with a negative sentiment held the smallest proportions across all metropolitan areas (13,970/92,453, 15.11% of tweets overall). The Los Angeles–Long Beach–Anaheim metropolitan area had the largest proportion of tweets with a negative sentiment (15,162/92,453, 16.4%), whereas the Miami–Fort Lauderdale–Pompano Beach metropolitan area had the lowest proportion of tweets with a negative sentiment (11,926/92,453, 12.9%).</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Distribution of sentiments and emotions found in COVID-19 vaccine tweets (N=92,453; January to May 2021).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Sentiment or emotion</td>
                <td>Tweets, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Positive sentiment</td>
                <td>50,415 (54.53)</td>
              </tr>
              <tr valign="top">
                <td>Trust</td>
                <td>41,317 (44.69)</td>
              </tr>
              <tr valign="top">
                <td>Anticipation</td>
                <td>32,127 (34.75)</td>
              </tr>
              <tr valign="top">
                <td>Fear</td>
                <td>27,227 (29.45)</td>
              </tr>
              <tr valign="top">
                <td>Sadness</td>
                <td>24,935 (26.97)</td>
              </tr>
              <tr valign="top">
                <td>Joy</td>
                <td>24,241 (26.22)</td>
              </tr>
              <tr valign="top">
                <td>Anger</td>
                <td>21,671 (23.44)</td>
              </tr>
              <tr valign="top">
                <td>Surprise</td>
                <td>20,562 (22.24)</td>
              </tr>
              <tr valign="top">
                <td>Disgust</td>
                <td>14,746 (15.95)</td>
              </tr>
              <tr valign="top">
                <td>Negative</td>
                <td>13,970 (15.11)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>The emotion analysis revealed trust as the predominantly expressed emotion in COVID-19 vaccine tweets across all metropolitan areas (41,317/92,453, 44.69%). The most perceived negative emotion across all metropolitan areas was fear (27,227/92,453, 29.45%). The least perceived positive emotions were joy (24,241/92,453, 26.22%) and surprise (20,562/92,453, 22.24%), whereas the least perceived negative emotions were anger (21,671/92,453, 23.44%) and disgust (14,746/92,453, 15.95%). Examples of tweets expressing positive, neutral, and negative sentiments are presented in <xref ref-type="boxed-text" rid="box2">Textbox 2</xref>.</p>
        <boxed-text id="box2" position="float">
          <title>Examples of tweets expressing a positive or negative sentiment toward COVID-19 vaccines.</title>
          <p>
            <bold>Positive sentiments</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>“Feeling blessed to be healthy this birthday. My two biggest presents are coming in the next week: Inauguration and my second vaccine.”</p>
            </list-item>
            <list-item>
              <p>“Hubby received his first vaccine does this morning-the sense of relief is for real, folks. #vaccinated”</p>
            </list-item>
            <list-item>
              <p>“With my granddaughter Aurora, Andy, and Elliot. I can see them again and give them a hug now that I am fully Covid 19 vaccinated. I have had both shots plus over 2 weeks since shot two. Thank you President Biden.”</p>
            </list-item>
            <list-item>
              <p>“My mom gets her second dose Sunday, big relief!”</p>
            </list-item>
            <list-item>
              <p>“I love so much that I got vaccinated today.”</p>
            </list-item>
            <list-item>
              <p>“Proud to work for you @bswhealth-my parents received their COVID vaccines this week at BUMC and said it was so quick and easy and the staff were so friendly! Thank you for taking care of them.”</p>
            </list-item>
          </list>
          <p>
            <bold>Negative sentiments</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>“This is from the Pfizer v-a-c-c-i-n-e. Please understand these shots cause harm. Injury is REAL &#38; not rare. It’s a shame these poor people are being gaslighted, &#38; media giants are censoring them.”</p>
            </list-item>
            <list-item>
              <p>“They way my people been bugging me about this d*mn vaccine, I’m not getting that s*it.”</p>
            </list-item>
            <list-item>
              <p>“No way!! No more lockdowns!! No vaccines!!! Oh and if your so concerned about the virus how about no illegals!!! Thank goodness for New Hampshire and Florida!! Go out.”</p>
            </list-item>
            <list-item>
              <p>Clearly you are ignorant of the fact that they said even if you get the vaccine you still have to wear a mask, social distance &#38; deal with all the same bull shit draconian orders. Even after blatant evidence you still want to get it. Heres 100% evidence of brain wash mind control.”</p>
            </list-item>
            <list-item>
              <p>“I am 80. You can have my vaccine. I refuse to get one. I take 2 grams of vitamin C hourly. That makes me IMMUNE. Read: Linus Pauling. No mask. I am out every day working &#38; walking in the park. Paul Kangas 4 Governor.”</p>
            </list-item>
            <list-item>
              <p>“F the stupid vaccine.”</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Attitudes Toward COVID-19 Vaccines in the HPS Data</title>
        <p>Most survey respondents (127,833/240,242, 53.21%) across all metropolitan areas indicated that they received a COVID-19 vaccine, ranging from 50.2% (7041/14,027) of the survey respondents in the Phoenix-Mesa-Chandler metropolitan area to 56.4% (10,032/17,787) of the survey respondents in the San Francisco–Oakland–Berkeley metropolitan area (<xref ref-type="table" rid="table7">Table 7</xref>). Among the respondents who indicated that they received a COVID-19 vaccine, the majority (65,195/127,833, 51%) also indicated that they received or planned to receive all required doses. Among the respondents who indicated that they had not received a COVID-19 vaccine, the majority (89,759/112,409, 79.85% combined) indicated that they <italic>probably</italic> or <italic>definitely</italic> would get vaccinated), ranging from 48% (6733/14,027) of the survey respondents in the Phoenix-Mesa-Chandler metropolitan area to 75.2% (13,376/17,787) of the survey respondents in the San Francisco–Oakland–Berkeley metropolitan area. For the purposes of this analysis, individuals who answered they that would “definitely get a vaccine” or “probably get a vaccine” once available were considered <italic>vaccine compliant</italic>, and individuals who answered that they would “probably not get a vaccine” or “definitely not get a vaccine” once available were considered <italic>vaccine hesitant</italic>.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Distribution of survey responses (unweighted; January to May 2021).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="620"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Question and responses</td>
                <td>Respondents, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Have you received a COVID-19 vaccine? (N=</bold>
                  <bold>240,242)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>127,833 (53.21)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No or did not answer</td>
                <td>112,409 (46.79)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Did you receive (or do you plan to receive) all required doses? (n=127,833)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>65,195 (51)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No or did not answer</td>
                <td>62,638 (49)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Once a vaccine to prevent COVID-19 is available to you, would you... (n=112,409)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Definitely get a vaccine</td>
                <td>69,233 (61.59)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Probably get a vaccine</td>
                <td>20,526 (18.26)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Be unsure about getting a vaccine</td>
                <td>3114 (2.77)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Probably not get a vaccine</td>
                <td>10,836 (9.64)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Definitely not get a vaccine</td>
                <td>8700 (7.74)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Predicting HPS Vaccine Attitudes Using Twitter-Based Attitudes</title>
        <p>We evaluated the performance of each GLM in terms of R-squared value and root mean square error (RMSE). Model 1a revealed significant associations (<italic>P</italic>&#60;.001) between the percentage of vaccine-compliant HPS respondents and the percentage of tweets expressing a positive sentiment and trust (<xref ref-type="table" rid="table8">Table 8</xref>). The R-squared value for the vaccine-compliant GLM (model 1a) was 94.11%, and the RMSE was 0.053, which suggests that we can predict vaccine compliance in the HPS fairly well using positive sentiments and emotions found on Twitter. The GLM coefficients showed that an increase in the percentage of tweets expressing a positive sentiment (<italic>P</italic>&#60;.001) was significantly associated with an increase in the percentage of vaccine-compliant HPS respondents. By contrast, an increase in the percentage of tweets expressing trust (<italic>P</italic>&#60;.001) was significantly associated with a decrease in the percentage of vaccine-compliant HPS respondents.</p>
        <table-wrap position="float" id="table8">
          <label>Table 8</label>
          <caption>
            <p>Model results.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="300"/>
            <col width="0"/>
            <col width="210"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="0"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Model and features</td>
                <td colspan="2">β coefficient (SE)</td>
                <td colspan="2"><italic>P</italic> value</td>
                <td colspan="3">R-squared (%)</td>
                <td colspan="2">Root mean square error</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>Model 1a (GLM<sup>a</sup>)</bold>
                </td>
                <td colspan="3">94.1</td>
                <td>0.053</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of positive sentiment</td>
                <td colspan="2">5.007 (.865)</td>
                <td colspan="2">&#60;.001<sup>b</sup></td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of joy</td>
                <td colspan="2">.043 (1.482)</td>
                <td colspan="2">.98</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of surprise</td>
                <td colspan="2">1.084 (1.163)</td>
                <td colspan="2">.35</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of trust</td>
                <td colspan="2">−4.696 (.865)</td>
                <td colspan="2">&#60;.001<sup>b</sup></td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of anticipation</td>
                <td colspan="2">.930 (1.197)</td>
                <td colspan="2">.44</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Model 1b (GLMM<sup>c</sup>)</bold>
                </td>
                <td colspan="3">82.5</td>
                <td>0.062</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of positive sentiment</td>
                <td colspan="2">4.791 (.865)</td>
                <td colspan="2">&#60;.001<sup>b</sup></td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of joy</td>
                <td colspan="2">.271 (1.483)</td>
                <td colspan="2">.86</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of surprise</td>
                <td colspan="2">.942 (1.157)</td>
                <td colspan="2">.42</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of trust</td>
                <td colspan="2">−4.529 (.906)</td>
                <td colspan="2">&#60;.001<sup>b</sup></td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of anticipation</td>
                <td colspan="2">1.239 (1.107)</td>
                <td colspan="2">.26</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Model 2a (GLM)</bold>
                </td>
                <td colspan="3">93.2</td>
                <td>0.01</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of negative sentiment</td>
                <td colspan="2">−1.340 (.581)</td>
                <td colspan="2">.02<sup>b</sup></td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of anger</td>
                <td colspan="2">.382 (.556)</td>
                <td colspan="2">.49</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of disgust</td>
                <td colspan="2">−.356 (.612)</td>
                <td colspan="2">.56</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of sadness</td>
                <td colspan="2">−1.011 (.625)</td>
                <td colspan="2">.11</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of fear</td>
                <td colspan="2">.715 (.532)</td>
                <td colspan="2">.18</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of anticipation</td>
                <td colspan="2">−.382 (.369)</td>
                <td colspan="2">.30</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Model 2b (GLMM)</bold>
                </td>
                <td colspan="3">9.4</td>
                <td>0.032</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of negative sentiment</td>
                <td colspan="2">−1.334 (.617)</td>
                <td colspan="2">.03<sup>b</sup></td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of anger</td>
                <td colspan="2">.425 (.587)</td>
                <td colspan="2">.47</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of disgust</td>
                <td colspan="2">−.312 (.657)</td>
                <td colspan="2">.64</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of sadness</td>
                <td colspan="2">−1.015 (.662)</td>
                <td colspan="2">.13</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of fear</td>
                <td colspan="2">.643 (.567)</td>
                <td colspan="2">.26</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Percentage of anticipation</td>
                <td colspan="2">−.456 (.388)</td>
                <td colspan="2">.24</td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table8fn1">
              <p><sup>a</sup>GLM: generalized linear model.</p>
            </fn>
            <fn id="table8fn2">
              <p><sup>b</sup>Statistically significant results (α=.05).</p>
            </fn>
            <fn id="table8fn3">
              <p><sup>c</sup>GLMM: generalized linear mixed model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>When we compared the vaccine-compliant GLM (model 1a) with the vaccine-compliant GLMM with metropolitan area as a random effect (model 1b), we observed a lower R-squared value (82.5%) and higher RMSE (0.062). Model 1b results also showed that an increase in the percentage of tweets expressing a positive sentiment (<italic>P</italic>&#60;.001) was significantly associated with an increase in the percentage of vaccine-compliant HPS respondents. By contrast, an increase in the percentage of tweets expressing trust (<italic>P</italic>&#60;.001) was significantly associated with a decrease in the percentage of vaccine-compliant HPS respondents.</p>
        <p>Model 2a revealed significant associations (<italic>P</italic>&#60;.05) between the percentage of vaccine-hesitant HPS respondents and the percentage of tweets expressing a negative sentiment. The R-squared value for the vaccine-hesitant GLM (model 2a) was similar to that of the vaccine-compliant GLM (93.17%). However, the vaccine-hesitant GLMM showed a much lower R-squared value (9.4%) and slightly higher RMSE (0.032). When compared with the vaccine-hesitant GLM (model 2a), whose only difference from the GLMM was the use of metropolitan area as a random effect, these results revealed that metropolitan area, as a fixed effect, and negative tweet sentiment (statistically significant in both model 2a and 2b) contributed to the majority of the variation in the percentage of vaccine-hesitant HPS respondents. When looking at the regressors, the results of both the vaccine-hesitant models, model 2a and 2b, showed that an increase in the percentage of tweets expressing a negative sentiment (<italic>P</italic>=.02 and <italic>P</italic>=.03, respectively) was associated with a decrease in the percentage of vaccine-hesitant HPS respondents.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we sought to determine whether the sentiments and emotions found in COVID-19 vaccine tweets can predict the vaccine hesitancy and compliance expressed in the US Census Bureau’s HPS. Depending on the model, GLMs and GLMMs showed significant relationships between (1) the percentage of vaccine-compliant HPS respondents and percentage of tweets expressing a positive sentiment and trust and (2) the percentage of vaccine-hesitant HPS respondents and percentage of tweets expressing a negative sentiment. Positive perceptions expressed on Twitter performed well in predicting positive perceptions in the survey for both GLMs and GLMMs, whereas negative perceptions expressed on Twitter performed well in predicting negative perceptions in the survey only for the GLM.</p>
      </sec>
      <sec>
        <title>Study Findings in Context</title>
        <p>The main objective of this study was to examine whether aggregate attitudes extracted from social media can predict vaccine attitudes collected via surveys. Specifically, we hypothesized that there is a direct, positive relationship between (1) positive sentiments found in Twitter and the HPS survey and (2) negative sentiments found in Twitter and the HPS survey. We expected to see a positive relationship between positive sentiments and emotions on Twitter and vaccine compliance in the HPS, as suggested in a previous study that showed a positive relationship between positive sentiment scores in COVID-19 vaccine–related tweets and an increase in vaccination rates [<xref ref-type="bibr" rid="ref30">30</xref>]. The results of both vaccine-compliant models revealed, as expected, significant positive relationships between the percentage of vaccine-compliant HPS respondents and percentage of tweets expressing a positive sentiment. However, in both vaccine-compliant models, the direction of one of the statistically significant relationships that were revealed was not what we expected. Both vaccine-compliant models revealed a significant inverse relationship between the vaccine-compliant measure in the HPS and percentage of tweets expressing trust.</p>
        <p>We also expected to see a positive relationship between negative sentiments and emotions on Twitter and vaccine hesitancy in the HPS. Although not significant, the percentages of tweets expressing anger and fear were, as expected, positively related to increases in vaccine hesitancy for both GLM and GLMM. However, the vaccine-hesitant GLM and GLMM both revealed a significant inverse relationship between the vaccine-hesitant measure in the HPS and percentage of tweets expressing a negative sentiment.</p>
        <p>The unexpected direction of the relationship between some vaccine perceptions in the survey and vaccine perceptions found on Twitter might be explained via ecological fallacy. An ecological fallacy occurs when an inference is made about the relationship between variables at an aggregate or a group level (eg, the level of a neighborhood, city, or country) based solely on the relationship between the same variables at an individual level [<xref ref-type="bibr" rid="ref31">31</xref>]. This can be problematic because the relationship between variables at the group level may differ from the relationship between the same variables at the individual level because of factors such as aggregation bias and other contextual factors.</p>
        <p>Another possible explanation for the unexpected findings on some of the relationships between vaccine perceptions in the survey and vaccine perceptions found on Twitter could be the possibility that some individuals’ web-based personas may not match their reality. For example, an individual might be obligated to get a vaccine because of their job or an upcoming travel, making them vaccine compliant, but rant about it on the web. In our sample data, this type of person would be classified as <italic>provaccine</italic> instead of <italic>antivaccine</italic> in the HPS but would also contribute to the negative perceptions found on Twitter. These findings also align with prior research that suggested an individual’s web-based persona may differ from their offline identity [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. This offline identity is often limited by physical, emotional, and financial circumstances that may be beyond an individual’s control [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. However, individuals have complete control over the identity they choose to present on the web [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. The inverse relationship between the vaccine-hesitant measure in the HPS and percentage of tweets expressing a negative sentiment may have also been due to the use of sarcasm in tweets, where the text itself contradicts what is actually meant by the user [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
        <p>The findings of this study contribute to the literature in 2 ways. First, although many studies have examined COVID-19 vaccine acceptance by extracting information from either surveys or social media, to our knowledge, no study has evaluated the relationship between these vastly different data sources. Unlike social media data collection, surveys come with postage, paper, printing, interviewer, and data entry costs, making them costly to administer [<xref ref-type="bibr" rid="ref39">39</xref>]. Evaluating the relationship between the attitudes found in surveys and those found on social media allows researchers to determine whether social media data can be trusted to reveal the same information that can be extracted from traditional surveys or whether there is a risk of losing important information in exchange for cutting costs. In this study, we found that COVID-19 vaccine attitudes in the HPS, measured as vaccine compliance and hesitancy, can be predicted using social media attitudes toward vaccines, measured via sentiments and emotions toward vaccines. The results of this study support the efforts of researchers, who over the past few years have looked at social media as a data source, citing the availability of readily available data and no- or low-cost data collection efforts [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        <p>This study makes further contributions by revealing the sentiments and emotions found in tweets across different metropolitan areas. This builds upon several other studies that leveraged natural language processing (NLP) methods, such as sentiment analysis, emotion analysis, and topic modeling, to examine vaccine-related perceptions [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>]. In this study, we found that most tweets expressed a provaccine sentiment, across all metropolitan areas. However, many tweets also expressed negative feelings and anticipations. This supports previous work, where researchers found many discussions about vaccine hesitancy but ultimately found most tweets to have a positive sentiment [<xref ref-type="bibr" rid="ref45">45</xref>]. This study also revealed trust as the dominant emotion found in tweets. This supports the results of a prior study that also found trust to be the dominant emotion expressed in tweets during an earlier period [<xref ref-type="bibr" rid="ref46">46</xref>]. A comparison of these results shows that the vaccine conversation on Twitter remained relatively consistent over time.</p>
        <p>Comparing COVID-19 vaccine perceptions on Twitter with attitudes in traditional public health surveys offers several benefits. Twitter serves as a platform for immediate and widespread dissemination of information. Analyzing vaccine perceptions on Twitter can help identify emerging issues or concerns related to COVID-19 vaccines at an early stage. This early detection allows public health authorities to address misconceptions, respond to emerging challenges, and promptly adapt their communication strategies. For example, the study results suggest that both models may be beneficial when deciding which cities to implement vaccine campaigns in, and the vaccine-compliant model can be used to better understand the role sentiments play in vaccination behaviors. This type of model can be used to craft effective social media messages related to COVID-19 vaccination.</p>
        <p>Twitter provides a platform for a wide range of voices and opinions, including those of individuals with varying backgrounds, beliefs, and experiences. Comparing Twitter data with survey data allows for the exploration of diverse perspectives and can uncover viewpoints that may not be captured through traditional surveys alone. This broader range of perspectives enhances the understanding of the complexities surrounding vaccine perceptions. Twitter data also allow for the real-time monitoring of public sentiment and reactions toward COVID-19 vaccines. This timely information can provide valuable insights into evolving trends, emerging concerns, and the impact of specific events or interventions. By comparing Twitter discussions with survey responses, researchers can identify shifts in public opinion and monitor the effectiveness of public health communication strategies in real time.</p>
        <p>Comparison with Twitter data can complement the findings of traditional surveys, providing a more comprehensive understanding of vaccine perceptions. Twitter data can provide contextual information, qualitative insights, and real-world examples that enrich the analysis of survey responses. The combination of both sources offers a more nuanced and holistic understanding of public attitudes toward COVID-19 vaccines.</p>
        <p>This study provides further evidence for the benefits of using social media data for public health research. The overarching contribution of this work suggests the adoption of alternative data sources and NLP techniques to assist in public health decision-making.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>Considering the limitations of this study may lead to future, related work. This study emphasizes the use of Twitter as a data source, but the lack of representation among Twitter users leads to bias in the sample and contributes to sampling errors. For example, Twitter users tend to be younger, be more educated, have higher incomes, and be more liberal [<xref ref-type="bibr" rid="ref47">47</xref>]. The lack of representation among Twitter users suggests the limited generalizability of the results to the larger population. Adding to this lack of representation is the limited sample of tweets available to the public via the Twitter Streaming application programming interface, which makes available a random sample of 1% of all tweets made by Twitter users at any given time [<xref ref-type="bibr" rid="ref48">48</xref>]. In addition, in studies assessing COVID-19 vaccine perceptions using social media data, individuals who do not have access to social media are systematically excluded from the analysis sample.</p>
        <p>The lack of demographic information on Twitter users is also a limitation to using Twitter as a data source. The absence of demographic information, such as age, gender, income, and education makes it challenging to understand the characteristics of the Twitter users who generate the data. This lack of information may lead to biased or incomplete analyses and limit the generalizability of the findings. In addition, the absence of demographic data makes it difficult to compare Twitter data with data from other sources that do contain demographic information, such as survey data. Despite these limitations, Twitter data can still be useful in certain contexts.</p>
        <p>It should also be acknowledged that the HPS data are also subject to sampling errors due to sample design, nonresponse, weighting adjustments, and measurement errors [<xref ref-type="bibr" rid="ref49">49</xref>]. As a result, the true relationship between aggregate attitudes extracted from social media and vaccine attitudes collected via surveys may be different from what was revealed in this study.</p>
        <p>Future studies should endeavor to use other NLP approaches, such as topic modeling, to compare public perceptions of the COVID-19 vaccine on social media with those found in surveys. The survey used in this study, the HPS, presented respondents with in-depth questions related to why they were vaccine hesitant, so applying topic models to tweets may reveal some of the same attitudes and themes as those expressed in the survey. Future studies may also involve pulling data from other social media platforms, such as Facebook, and comparing the overall perceptions reflected across all media.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The ongoing COVID-19 pandemic requires consistent monitoring and data-driven public health policies. To slow the spread of the virus, public health officials have stressed that vaccines are essential in the worldwide battle against COVID-19. However, vaccine hesitancy continues to be a barrier to effective and consistent vaccine rollout programs. Prior efforts have used surveys to gauge attitudes toward the COVID-19 vaccine, but this study suggests that these public perceptions may also be extracted from a readily available, low-cost data source, social media. In this study, we validated social media as a data source by evaluating the relationship between the attitudes expressed among Twitter users and attitudes expressed among respondents to the HPS as well as the ability of attitudes expressed among Twitter users to predict vaccine compliance and hesitancy among the HPS respondents. Leveraging Twitter data alongside traditional surveys can provide a more comprehensive and nuanced understanding of COVID-19 vaccine perceptions, facilitating evidence-based decision-making and tailored public health strategies.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Model diagnostics.</p>
        <media xlink:href="infodemiology_v3i1e43700_app1.doc" xlink:title="DOC File , 3561 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">GLM</term>
          <def>
            <p>generalized linear model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GLMM</term>
          <def>
            <p>generalized linear mixed model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HPS</term>
          <def>
            <p>Household Pulse Survey</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NRC</term>
          <def>
            <p>Natural Language Understanding Research Consortium</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RMSE</term>
          <def>
            <p>root mean square error</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Household pulse survey COVID-19 vaccination tracker</article-title>
          <source>United States Census Bureau</source>
          <year>2021</year>
          <month>12</month>
          <day>22</day>
          <access-date>2022-01-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/library/visualizations/interactive/household-pulse-survey-covid-19-vaccination-tracker.html">https://www.census.gov/library/visualizations/interactive/household-pulse-survey-covid-19-vaccination-tracker.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garett</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Online misinformation and vaccine hesitancy</article-title>
          <source>Transl Behav Med</source>
          <year>2021</year>
          <month>12</month>
          <day>14</day>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>2194</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34529080"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/tbm/ibab128</pub-id>
          <pub-id pub-id-type="medline">34529080</pub-id>
          <pub-id pub-id-type="pii">6371221</pub-id>
          <pub-id pub-id-type="pmcid">PMC8515268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pershad</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hangge</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Albadawi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Oklu</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Social medicine: Twitter in healthcare</article-title>
          <source>J Clin Med</source>
          <year>2018</year>
          <month>05</month>
          <day>28</day>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>121</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jcm7060121"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jcm7060121</pub-id>
          <pub-id pub-id-type="medline">29843360</pub-id>
          <pub-id pub-id-type="pii">jcm7060121</pub-id>
          <pub-id pub-id-type="pmcid">PMC6025547</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chunara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Andrews</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Social and news media enable estimation of epidemiological patterns early in the 2010 Haitian cholera outbreak</article-title>
          <source>Am J Trop Med Hyg</source>
          <year>2012</year>
          <month>01</month>
          <volume>86</volume>
          <issue>1</issue>
          <fpage>39</fpage>
          <lpage>45</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22232449"/>
          </comment>
          <pub-id pub-id-type="doi">10.4269/ajtmh.2012.11-0597</pub-id>
          <pub-id pub-id-type="medline">22232449</pub-id>
          <pub-id pub-id-type="pii">86/1/39</pub-id>
          <pub-id pub-id-type="pmcid">PMC3247107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Torrens</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Frias-Martinez</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Understanding citizens' and local governments' digital communications during natural disasters: the case of snowstorms</article-title>
          <source>Proceedings of the 2017 ACM on Web Science Conference</source>
          <year>2017</year>
          <month>06</month>
          <conf-name>WebSci '17: ACM Web Science Conference</conf-name>
          <conf-date>June 25-28, 2017</conf-date>
          <conf-loc>Troy, NY</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3091478.3091502</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ball-Rokeach</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>DeFleur</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <article-title>A dependency model of mass-media effects</article-title>
          <source>Commun Res</source>
          <year>1976</year>
          <month>1</month>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1177/009365027600300101</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marston</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>P-C</given-names>
            </name>
            <name name-style="western">
              <surname>Girishan Prabhu</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sharaievska</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Browning</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Earle</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ivan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kanozia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Öztürk Çalıkoğlu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Arslan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bilir-Koca</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Alexandra Silva</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Buttigieg</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Großschädl</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Schüttengruber</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Digital practices by citizens during the COVID-19 pandemic: findings from an international multisite study</article-title>
          <source>JMIR Ment Health</source>
          <year>2023</year>
          <month>03</month>
          <day>06</day>
          <volume>10</volume>
          <fpage>e41304</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2023//e41304/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/41304</pub-id>
          <pub-id pub-id-type="medline">36877558</pub-id>
          <pub-id pub-id-type="pii">v10i1e41304</pub-id>
          <pub-id pub-id-type="pmcid">PMC9994468</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Charquero-Ballester</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Nissen</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Bechmann</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Different types of COVID-19 misinformation have different emotional valence on Twitter</article-title>
          <source>Big Data Soc</source>
          <year>2021</year>
          <month>09</month>
          <day>22</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>205395172110412</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20539517211041279"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20539517211041279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bonnevie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gallegos-Jeffrey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goldbarg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Byrd</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Smyser</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Quantifying the rise of vaccine opposition on Twitter during the COVID-19 pandemic</article-title>
          <source>J Commun Healthc</source>
          <year>2020</year>
          <month>12</month>
          <day>15</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>12</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1080/17538068.2020.1858222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deiner</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Fathy</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Niemeyer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ackley</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lietman</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Porco</surname>
              <given-names>TC</given-names>
            </name>
          </person-group>
          <article-title>Facebook and Twitter vaccine sentiment in response to measles outbreaks</article-title>
          <source>Health Informatics J</source>
          <year>2019</year>
          <month>09</month>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>1116</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/1460458217740723?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1460458217740723</pub-id>
          <pub-id pub-id-type="medline">29148313</pub-id>
          <pub-id pub-id-type="pmcid">PMC5930144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Alleaume</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Peretti-Watel</surname>
              <given-names>P</given-names>
            </name>
            <collab>COCONEL Group</collab>
          </person-group>
          <article-title>The French public's attitudes to a future COVID-19 vaccine: the politicization of a public health issue</article-title>
          <source>Soc Sci Med</source>
          <year>2020</year>
          <month>11</month>
          <volume>265</volume>
          <fpage>113414</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33038683"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.socscimed.2020.113414</pub-id>
          <pub-id pub-id-type="medline">33038683</pub-id>
          <pub-id pub-id-type="pii">S0277-9536(20)30633-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7537647</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>EY</given-names>
            </name>
            <name name-style="western">
              <surname>Yeoh</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>SY</given-names>
            </name>
          </person-group>
          <article-title>Intention of nurses to accept coronavirus disease 2019 vaccination and change of intention to accept seasonal influenza vaccination during the coronavirus disease 2019 pandemic: a cross-sectional survey</article-title>
          <source>Vaccine</source>
          <year>2020</year>
          <month>10</month>
          <day>21</day>
          <volume>38</volume>
          <issue>45</issue>
          <fpage>7049</fpage>
          <lpage>56</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32980199"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2020.09.021</pub-id>
          <pub-id pub-id-type="medline">32980199</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(20)31175-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7834255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ruiz</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Predictors of intention to vaccinate against COVID-19: results of a nationwide survey</article-title>
          <source>Vaccine</source>
          <year>2021</year>
          <month>03</month>
          <day>12</day>
          <volume>39</volume>
          <issue>7</issue>
          <fpage>1080</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33461833"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2021.01.010</pub-id>
          <pub-id pub-id-type="medline">33461833</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(21)00014-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7794597</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arigo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pagoto</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carter-Harris</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Nebeker</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Using social media for health research: methodological and ethical considerations for recruitment and intervention delivery</article-title>
          <source>Digit Health</source>
          <year>2018</year>
          <month>05</month>
          <day>07</day>
          <volume>4</volume>
          <fpage>2055207618771757</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/abs/10.1177/2055207618771757?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2055207618771757</pub-id>
          <pub-id pub-id-type="medline">29942634</pub-id>
          <pub-id pub-id-type="pii">10.1177_2055207618771757</pub-id>
          <pub-id pub-id-type="pmcid">PMC6016568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sigalo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Awasthi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abrar</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Frias-Martinez</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Using COVID-19 vaccine attitudes on Twitter to improve vaccine uptake forecast models in the United States: infodemiology study of Tweets</article-title>
          <source>JMIR Infodemiology</source>
          <year>2023</year>
          <month>08</month>
          <day>21</day>
          <volume>3</volume>
          <fpage>e43703</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2023//e43703/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/43703</pub-id>
          <pub-id pub-id-type="medline">37390402</pub-id>
          <pub-id pub-id-type="pii">v3i1e43703</pub-id>
          <pub-id pub-id-type="pmcid">PMC10477926</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>KB</given-names>
            </name>
          </person-group>
          <article-title>Researching internet-based populations: advantages and disadvantages of online survey research, online questionnaire authoring software packages, and web survey services</article-title>
          <source>J Comput Mediat Commun</source>
          <year>2005</year>
          <month>4</month>
          <day>1</day>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>JCMC1034</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/jcmc/article/10/3/JCMC1034/4614509"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1083-6101.2005.tb00259.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Enriquez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>COVID-19’s socioeconomic impact on low-income benefit recipients: early evidence from tracking surveys</article-title>
          <source>Socius</source>
          <year>2020</year>
          <month>11</month>
          <day>25</day>
          <volume>6</volume>
          <fpage>237802312097079</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/2378023120970794"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2378023120970794</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>DX</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Beltran</surname>
              <given-names>TF</given-names>
            </name>
          </person-group>
          <article-title>Food insecurity in households with children amid the COVID-19 pandemic: evidence from the household pulse survey</article-title>
          <source>Soc Curr</source>
          <year>2021</year>
          <month>04</month>
          <day>23</day>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>314</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/23294965211011593"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/23294965211011593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <article-title>Household pulse survey technical documentation</article-title>
          <source>United States Census Bureau</source>
          <access-date>2023-05-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/programs-surveys/household-pulse-survey/technical-documentation.html">https://www.census.gov/programs-surveys/household-pulse-survey/technical-documentation.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daly</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Public trust and willingness to vaccinate against COVID-19 in the US from October 14, 2020, to March 29, 2021</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>06</month>
          <day>15</day>
          <volume>325</volume>
          <issue>23</issue>
          <fpage>2397</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34028495"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2021.8246</pub-id>
          <pub-id pub-id-type="medline">34028495</pub-id>
          <pub-id pub-id-type="pii">2780519</pub-id>
          <pub-id pub-id-type="pmcid">PMC8145162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silge</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>tidytext: text mining and analysis using tidy data principles in R</article-title>
          <source>J Open Source Softw</source>
          <year>2016</year>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>37</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.theoj.org/joss-papers/joss.00037/10.21105.joss.00037.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.21105/joss.00037</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <article-title>NRC word-emotion association lexicon</article-title>
          <source>NRC Emotion Lexicon</source>
          <access-date>2022-01-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://saifmohammad.com/WebPages/NRC-Emotion-Lexicon.htm">http://saifmohammad.com/WebPages/NRC-Emotion-Lexicon.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kausar</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Soosaimanickam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nasar</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Public sentiment analysis on Twitter data during COVID-19 outbreak</article-title>
          <source>Int J Adv Comput Sci Appl</source>
          <year>2021</year>
          <volume>12</volume>
          <issue>2</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://thesai.org/Downloads/Volume12No2/Paper_52-Public_Sentiment_Analysis_on_Twitter_Data.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.14569/IJACSA.2021.0120252</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeileis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cribari-Neto</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Gruen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kosmidis</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Simas</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Rocha</surname>
              <given-names>AV</given-names>
            </name>
          </person-group>
          <article-title>Package ‘betareg’</article-title>
          <source>The Comprehensive R Archive Network</source>
          <year>2022</year>
          <month>10</month>
          <day>12</day>
          <access-date>2023-11-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/betareg/betareg.pdf">https://cran.r-project.org/web/packages/betareg/betareg.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rizopoulos</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>GLMMadaptive: generalized linear mixed models using adaptive gaussian quadrature</article-title>
          <source>The Comprehensive R Archive Network</source>
          <year>2023</year>
          <access-date>2023-05-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cloud.r-project.org/web/packages/GLMMadaptive/index.html">https://cloud.r-project.org/web/packages/GLMMadaptive/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lingsma</surname>
              <given-names>HF</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Lesaffre</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Logistic random effects regression models: a comparison of statistical packages for binary and ordinal outcomes</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2011</year>
          <month>05</month>
          <day>23</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>77</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-11-77"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2288-11-77</pub-id>
          <pub-id pub-id-type="medline">21605357</pub-id>
          <pub-id pub-id-type="pii">1471-2288-11-77</pub-id>
          <pub-id pub-id-type="pmcid">PMC3112198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>XA</given-names>
            </name>
            <name name-style="western">
              <surname>Donaldson</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Correa-Cano</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Hodgson</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Inger</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A brief introduction to mixed effects modelling and multi-model inference in ecology</article-title>
          <source>PeerJ</source>
          <year>2018</year>
          <month>5</month>
          <day>23</day>
          <volume>6</volume>
          <fpage>e4794</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29844961"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj.4794</pub-id>
          <pub-id pub-id-type="medline">29844961</pub-id>
          <pub-id pub-id-type="pii">4794</pub-id>
          <pub-id pub-id-type="pmcid">PMC5970551</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Berkout</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Lindhiem</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Analyzing proportion scores as outcomes for prevention trials: a statistical primer</article-title>
          <source>Prev Sci</source>
          <year>2017</year>
          <month>04</month>
          <volume>18</volume>
          <issue>3</issue>
          <fpage>312</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26960687"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11121-016-0643-6</pub-id>
          <pub-id pub-id-type="medline">26960687</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11121-016-0643-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5860877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <source>IRB Definitions</source>
          <access-date>2023-11-27</access-date>
          <publisher-name>Division of Research - University of Maryland</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://research.umd.edu/resources/research-compliance/institutional-review-board-irb/irb-definitions">https://research.umd.edu/resources/research-compliance/institutional-review-board-irb/irb-definitions</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Heymann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Szabo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Apas Vasandani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khubchandani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DiLorenzo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Coffee</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Exploring coronavirus disease 2019 vaccine hesitancy on Twitter using sentiment analysis and natural language processing algorithms</article-title>
          <source>Clin Infect Dis</source>
          <year>2022</year>
          <month>05</month>
          <day>15</day>
          <volume>74</volume>
          <issue>Suppl_3</issue>
          <fpage>e4</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1093/cid/ciac141</pub-id>
          <pub-id pub-id-type="medline">35568473</pub-id>
          <pub-id pub-id-type="pii">6585957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reichert</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brüßler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reinhard</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Giurgiu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hoell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zipf</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer-Lindenberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tost</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ebner-Priemer</surname>
              <given-names>UW</given-names>
            </name>
          </person-group>
          <article-title>The association of stress and physical activity: mind the ecological fallacy</article-title>
          <source>Ger J Exerc Sport Res</source>
          <year>2022</year>
          <month>05</month>
          <day>06</day>
          <volume>52</volume>
          <issue>2</issue>
          <fpage>282</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1007/s12662-022-00823-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12662-022-00823-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A literature review of online identity reconstruction</article-title>
          <source>Front Psychol</source>
          <year>2021</year>
          <month>08</month>
          <day>23</day>
          <volume>12</volume>
          <fpage>696552</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34497560"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyg.2021.696552</pub-id>
          <pub-id pub-id-type="medline">34497560</pub-id>
          <pub-id pub-id-type="pmcid">PMC8419451</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>H-W</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Examining knowledge contribution from the perspective of an online identity in blogging communities</article-title>
          <source>Comput Hum Behav</source>
          <year>2011</year>
          <month>9</month>
          <volume>27</volume>
          <issue>5</issue>
          <fpage>1760</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S0747563211000616?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chb.2011.03.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Achieving self-congruency? Examining why individuals reconstruct their virtual identity in communities of interest established within social network platforms</article-title>
          <source>Comput Hum Behav</source>
          <year>2015</year>
          <month>09</month>
          <volume>50</volume>
          <fpage>465</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S0747563215003143?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chb.2015.04.027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bargh</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>McKenna</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzsimons</surname>
              <given-names>GM</given-names>
            </name>
          </person-group>
          <article-title>Can you see the real me? Activation and expression of the “true self” on the internet</article-title>
          <source>J Soc Issues</source>
          <year>2002</year>
          <month>12</month>
          <day>17</day>
          <volume>58</volume>
          <issue>1</issue>
          <fpage>33</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1111/1540-4560.00247</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Donath</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Kollock</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Identity and deception in the virtual community</article-title>
          <source>Communities in Cyberspace</source>
          <year>1998</year>
          <month>12</month>
          <day>17</day>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>Routledge</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schau</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gilly</surname>
              <given-names>MC</given-names>
            </name>
          </person-group>
          <article-title>We are what we post? Self-presentation in personal web space</article-title>
          <source>J Consum Res</source>
          <year>2003</year>
          <month>12</month>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>385</fpage>
          <lpage>404</lpage>
          <pub-id pub-id-type="doi">10.1086/378616</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Govindan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Balakrishnan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>A machine learning approach in analysing the effect of hyperboles using negative sentiment tweets for sarcasm detection</article-title>
          <source>J King Saud Univ Comput Inf Sci</source>
          <year>2022</year>
          <month>09</month>
          <volume>34</volume>
          <issue>8</issue>
          <fpage>5110</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S1319157822000210?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jksuci.2022.01.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morland</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Filomena</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Disparities in the availability of fruits and vegetables between racially segregated urban neighbourhoods</article-title>
          <source>Public Health Nutr</source>
          <year>2007</year>
          <month>12</month>
          <volume>10</volume>
          <issue>12</issue>
          <fpage>1481</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1017/S1368980007000079</pub-id>
          <pub-id pub-id-type="medline">17582241</pub-id>
          <pub-id pub-id-type="pii">S1368980007000079</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Sloane</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Nascimento</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Diamant</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Guinyard</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yancey</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Flynn</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>African Americans' access to healthy food options in South Los Angeles restaurants</article-title>
          <source>Am J Public Health</source>
          <year>2005</year>
          <month>04</month>
          <volume>95</volume>
          <issue>4</issue>
          <fpage>668</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.2105/AJPH.2004.050260</pub-id>
          <pub-id pub-id-type="medline">15798128</pub-id>
          <pub-id pub-id-type="pii">95/4/668</pub-id>
          <pub-id pub-id-type="pmcid">PMC1449239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sigalo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>St Jean</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Frias-Martinez</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Using social media to predict food deserts in the United States: infodemiology study of tweets</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2022</year>
          <month>07</month>
          <day>05</day>
          <volume>8</volume>
          <issue>7</issue>
          <fpage>e34285</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2022/7/e34285/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/34285</pub-id>
          <pub-id pub-id-type="medline">35788108</pub-id>
          <pub-id pub-id-type="pii">v8i7e34285</pub-id>
          <pub-id pub-id-type="pmcid">PMC9297137</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sattar</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Arifuzzaman</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccination awareness and aftermath: public sentiment analysis on Twitter data and vaccinated population prediction in the USA</article-title>
          <source>Appl Sci</source>
          <year>2021</year>
          <month>06</month>
          <day>30</day>
          <volume>11</volume>
          <issue>13</issue>
          <fpage>6128</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/2076-3417/11/13/6128"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/app11136128</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Public attitudes toward COVID-19 vaccines on English-language Twitter: a sentiment analysis</article-title>
          <source>Vaccine</source>
          <year>2021</year>
          <month>09</month>
          <day>15</day>
          <volume>39</volume>
          <issue>39</issue>
          <fpage>5499</fpage>
          <lpage>505</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34452774"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2021.08.058</pub-id>
          <pub-id pub-id-type="medline">34452774</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(21)01106-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC8439574</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tahir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gogate</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dashtipour</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-enabled analysis of public attitudes on Facebook and Twitter toward COVID-19 vaccines in the United Kingdom and the United States: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>04</month>
          <day>05</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>e26627</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/4/e26627/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26627</pub-id>
          <pub-id pub-id-type="medline">33724919</pub-id>
          <pub-id pub-id-type="pii">v23i4e26627</pub-id>
          <pub-id pub-id-type="pmcid">PMC8023383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yousefinaghani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mubareka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Papadopoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sharif</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An analysis of COVID-19 vaccine sentiments and opinions on Twitter</article-title>
          <source>Int J Infect Dis</source>
          <year>2021</year>
          <month>07</month>
          <volume>108</volume>
          <fpage>256</fpage>
          <lpage>62</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1201-9712(21)00462-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijid.2021.05.059</pub-id>
          <pub-id pub-id-type="medline">34052407</pub-id>
          <pub-id pub-id-type="pii">S1201-9712(21)00462-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8157498</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Luli</surname>
              <given-names>GK</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccine-related discussion on Twitter: topic modeling and sentiment analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>06</month>
          <day>29</day>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>e24435</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/6/e24435/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24435</pub-id>
          <pub-id pub-id-type="medline">34115608</pub-id>
          <pub-id pub-id-type="pii">v23i6e24435</pub-id>
          <pub-id pub-id-type="pmcid">PMC8244724</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freedman</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>Local food environments: they're all stocked differently</article-title>
          <source>Am J Community Psychol</source>
          <year>2009</year>
          <month>12</month>
          <volume>44</volume>
          <issue>3-4</issue>
          <fpage>382</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1007/s10464-009-9272-6</pub-id>
          <pub-id pub-id-type="medline">19838789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>QC</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>H-W</given-names>
            </name>
            <name name-style="western">
              <surname>Kath</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Building a national neighborhood dataset from geotagged Twitter data for indicators of happiness, diet, and physical activity</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2016</year>
          <month>10</month>
          <day>17</day>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e158</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2016/2/e158/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.5869</pub-id>
          <pub-id pub-id-type="medline">27751984</pub-id>
          <pub-id pub-id-type="pii">v2i2e158</pub-id>
          <pub-id pub-id-type="pmcid">PMC5088343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bradley</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Kuriwaki</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Isakov</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sejdinovic</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>X-L</given-names>
            </name>
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Unrepresentative big surveys significantly overestimated US vaccine uptake</article-title>
          <source>Nature</source>
          <year>2021</year>
          <month>12</month>
          <volume>600</volume>
          <issue>7890</issue>
          <fpage>695</fpage>
          <lpage>700</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34880504"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-021-04198-4</pub-id>
          <pub-id pub-id-type="medline">34880504</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-021-04198-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8653636</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
