<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id>
      <journal-title>JMIR Infodemiology</journal-title>
      <issn pub-type="epub">2564-1891</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v4i1e51156</article-id>
      <article-id pub-id-type="pmid">39269743</article-id>
      <article-id pub-id-type="doi">10.2196/51156</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>The Use of Natural Language Processing Methods in Reddit to Investigate Opioid Use: Scoping Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mackey</surname>
            <given-names>Tim</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Haupt</surname>
            <given-names>Michael</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chandrasekaran</surname>
            <given-names>Ranganathan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Nguyen</surname>
            <given-names>Thu</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Almeida</surname>
            <given-names>Alexandra</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Scientific Computing Program</institution>
            <institution>Oswaldo Cruz Foundation</institution>
            <addr-line>Avenida Brasil, 4365, Antiga Residência Oficial Manguinhos</addr-line>
            <addr-line>Rio de Janeiro, 21045900</addr-line>
            <country>Brazil</country>
            <phone>55 213836 1212</phone>
            <email>alexandra.almeida@fiocruz.br</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2092-5070</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Patton</surname>
            <given-names>Thomas</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5134-3308</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Conway</surname>
            <given-names>Mike</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3209-8108</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Gupta</surname>
            <given-names>Amarnath</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0897-120X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Strathdee</surname>
            <given-names>Steffanie A</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7724-691X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Bórquez</surname>
            <given-names>Annick</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6033-9837</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Scientific Computing Program</institution>
        <institution>Oswaldo Cruz Foundation</institution>
        <addr-line>Rio de Janeiro</addr-line>
        <country>Brazil</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>San Diego State University</institution>
        <institution>School of Social Work</institution>
        <addr-line>San Diego, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Medicine</institution>
        <institution>University of California San Diego</institution>
        <addr-line>San Diego, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of Computing and Information Systems</institution>
        <institution>The University of Melbourne</institution>
        <addr-line>Melbourne</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>San Diego Supercomputer Center</institution>
        <institution>University of California San Diego</institution>
        <addr-line>San Diego, CA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Alexandra Almeida <email>alexandra.almeida@fiocruz.br</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>13</day>
        <month>9</month>
        <year>2024</year>
      </pub-date>
      <volume>4</volume>
      <elocation-id>e51156</elocation-id>
      <history>
        <date date-type="received">
          <day>23</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>3</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>1</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>18</day>
          <month>6</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Alexandra Almeida, Thomas Patton, Mike Conway, Amarnath Gupta, Steffanie A Strathdee, Annick Bórquez. Originally published in JMIR Infodemiology (https://infodemiology.jmir.org), 13.09.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on https://infodemiology.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://infodemiology.jmir.org/2024/1/e51156" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The growing availability of big data spontaneously generated by social media platforms allows us to leverage natural language processing (NLP) methods as valuable tools to understand the opioid crisis.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to understand how NLP has been applied to Reddit (Reddit Inc) data to study opioid use.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We systematically searched for peer-reviewed studies and conference abstracts in PubMed, Scopus, PsycINFO, ACL Anthology, IEEE Xplore, and Association for Computing Machinery data repositories up to July 19, 2022. Inclusion criteria were studies investigating opioid use, using NLP techniques to analyze the textual corpora, and using Reddit as the social media data source. We were specifically interested in mapping studies’ overarching goals and findings, methodologies and software used, and main limitations.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In total, 30 studies were included, which were classified into 4 nonmutually exclusive <italic>overarching goal</italic> categories: methodological (n=6, 20% studies), infodemiology (n=22, 73% studies), infoveillance (n=7, 23% studies), and pharmacovigilance (n=3, 10% studies). NLP methods were used to identify content relevant to opioid use among vast quantities of textual data, to establish potential relationships between opioid use patterns or profiles and contextual factors or comorbidities, and to anticipate individuals’ transitions between different opioid-related subreddits, likely revealing progression through opioid use stages. Most studies used an embedding technique (12/30, 40%), prediction or classification approach (12/30, 40%), topic modeling (9/30, 30%), and sentiment analysis (6/30, 20%). The most frequently used programming languages were Python (20/30, 67%) and R (2/30, 7%). Among the studies that reported limitations (20/30, 67%), the most cited was the uncertainty regarding whether redditors participating in these forums were representative of people who use opioids (8/20, 40%). The papers were very recent (28/30, 93%), from 2019 to 2022, with authors from a range of disciplines.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This scoping review identified a wide variety of NLP techniques and applications used to support surveillance and social media interventions addressing the opioid crisis. Despite the clear potential of these methods to enable the identification of opioid-relevant content in Reddit and its analysis, there are limits to the degree of interpretive meaning that they can provide. Moreover, we identified the need for standardized ethical guidelines to govern the use of Reddit data to safeguard the anonymity and privacy of people using these forums.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>opioid</kwd>
        <kwd>Reddit</kwd>
        <kwd>natural language processing</kwd>
        <kwd>NLP</kwd>
        <kwd>machine learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Opioid use disorder (OUD) is a chronic condition that affects more than 40 million people worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. In 2019, the Global Burden of Disease study estimated that 128,000 deaths were attributed to drug use disorders [<xref ref-type="bibr" rid="ref2">2</xref>], and the United States accounted for a large proportion of these deaths, with &#62;70,000 deaths directly attributable to overdose [<xref ref-type="bibr" rid="ref3">3</xref>]. US overdose deaths reached a record high in 2021, with 107,000 deaths, of which 75% were opioid related [<xref ref-type="bibr" rid="ref4">4</xref>]. The magnitude of these numbers highlights the need for a strong surveillance infrastructure, including systems that support tracking trends in drug use and emerging patterns in the drug supply chain, as well as a good understanding of the experiences of, challenges of, and sources of support for people who use opioids, to inform a timely and effective response to this ongoing epidemic.</p>
        <p>Social media platforms represent an important and accessible source of community support for people who use opioids, given they facilitate getting technical know-how and peer support. Nonetheless, analyzing such large textual data sets is challenging. Beyond the traditional qualitative approach to analyzing textual data, natural language processing (NLP) allows the analysis of textual data using computational methods and artificial intelligence. NLP lexicon-based methods and both supervised and unsupervised machine learning tools have been used to explore substance-related research questions on platforms such as Twitter (subsequently rebranded X; X Corp) [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref10">10</xref>], Reddit (Reddit Inc) [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>], and web-based health communities [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>In contrast with Reddit, which allows for long-form narratives, Twitter provides very condensed information for each data point since, historically, posts have been limited to 280 characters. An additional characteristic of tweets as a data type is that (at least in some cases) tweets contain metadata geolocational information, allowing for the ecological study of associations between the volume of mentions of a particular topic and a health outcome of interest in a given setting [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Facebook (Meta Platforms Inc) offers the advantage of providing information on social networks and the dissemination of information within these networks [<xref ref-type="bibr" rid="ref16">16</xref>]. However, Facebook data are not necessarily public in the same way that Twitter and Reddit data are public (ie, on the open web). Facebook users typically form closed and semiprivate communities in which there is an expectation of data privacy, rendering the data unsuitable (both practically and ethically) for research purposes, as a specific consent model and process is absent. Reddit is a publicly accessible social media platform, with forums created and moderated to discuss specific themes. Participants (ie, redditors) use the platform anonymity and “throwaway” user accounts to share news, content, and thoughts through posting. Redditors’ anonymity is key to authentic accounts of both positive and negative experiences with drugs (including in the context of treatment) and daily life situations that may impact the physical and mental health of people who use opioids, without fearing stigmatization. This platform is one of the most popular web-based social media platforms and has provided a space for exchange and discussion since 2005. It is mainly used by English speakers [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>Despite Twitter being the platform of choice for most studies [<xref ref-type="bibr" rid="ref18">18</xref>], Reddit thematic forums have shown to be an advantage for research on substance use, skipping the filtering stage of posts related to the research topic. NLP techniques enable the use of massive text corpora and the exploration of a multitude of research questions related to opioid use based on the perspectives of people sharing their experiences on social media platforms, such as Reddit.</p>
        <p>Reddit ranked as the third most visited website in the United States [<xref ref-type="bibr" rid="ref19">19</xref>], and in October 2020, it achieved &#62;52 million daily active users [<xref ref-type="bibr" rid="ref20">20</xref>]. Reddit has been used as a source of information to understand drug-related epidemics mainly due to the lower risk of social desirability bias, the real-time aspect of the data, and lower noise due to its thematic forums structure [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. Given that the majority of its users are from the United States (47.82%), United Kingdom (7.6%), Canada (7.45%), and Australia (3.89%) and that these countries are all undergoing severe opioid-related epidemics, Reddit represents a valuable source of data to better understand the daily experiences of people who use opioids in these settings [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>This scoping review aimed to understand how Reddit data have been leveraged to study the opioid epidemic using NLP to provide an overview of how these novel data sources and tools can serve the field of substance use research. More specifically, we were interested in mapping the studies’ (1) overarching goals and findings, (2) methodologies and software used, and (3) main limitations. In addition, to help future research in this area to deal with abbreviations, slang, and common misspellings, we systematically collected the papers’ list of synonyms and built a comprehensive synset with semantically equivalent terms within the opioid use field. This list could help the broader research community to rigorously investigate opioid use in Reddit using text processing algorithms.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>This scoping review followed the Joanna Briggs Institute (JBI) methodology for scoping reviews based on the studies by Arksey and O’Malley [<xref ref-type="bibr" rid="ref25">25</xref>] and Levac et al [<xref ref-type="bibr" rid="ref26">26</xref>]. We used the JBI population (or participants)/concept/context framework to guide our research questions and ultimately inform our search strategy to understand how NLP methods have been applied to Reddit data to inform research on opioid use. Our study protocol was registered on the Open Science Framework [<xref ref-type="bibr" rid="ref27">27</xref>] on June 29, 2022. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> details the JBI population (or participants)/concept/context framework rationale behind each research question of this scoping review.</p>
      </sec>
      <sec>
        <title>Search Strategy</title>
        <p>As the research topic encompasses studies targeting opioid use, we selected the following search engines: (1) PubMed to cover the biomedical literature; (2) Scopus to cover life, social, physical, and health sciences; (3) PsycINFO to cover the psychology field; and (4) ACL Anthology to cover NLP and computational linguistics. As the research team was aware of recent studies using NLP in the substance use field led mainly by authors from the engineering field, we also included IEEE Xplore and Association for Computing Machinery as data repositories for conference abstracts.</p>
        <p>Our search was built based on team members’ expertise in the topic and aimed to identify studies jointly covering three essential aspects: (1) opioid use, as the subject under analysis; (2) NLP techniques, as the methods used to analyze the textual corpora; and (3) Reddit, as the data source used in the study’s analyses. The terms used to capture opioid-related studies were based on standard terms describing opioids, including “heroin” and “fentanyl” as well as the National Institute on Drug Abuse’s list of most commonly prescribed opioids [<xref ref-type="bibr" rid="ref28">28</xref>] and medications for OUD (MOUD) [<xref ref-type="bibr" rid="ref29">29</xref>]. To ensure our search would only select studies that used a quantitative methodology to analyze the textual data (ie, NLP), we leveraged the “artificial intelligence” methods included in the Medical Subject Headings vocabulary thesaurus [<xref ref-type="bibr" rid="ref30">30</xref>], which we supplemented with members’ expertise in the topic to broaden our scope. As many essential papers in this field do not state “Reddit” as the social media environment under analysis in the abstract, and many search engines only consider the abstract (and not the full paper), we included the broad term “social media” in the search. <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> details the search strategy, presenting the Medical Subject Headings hierarchy and the final search query used to obtain relevant studies.</p>
        <p>We included papers that appeared in the search until July 19, 2022, with no cutoff for earlier studies. We selected original research papers published in English that stated that they collected textual data on opioid use from Reddit forums (even if other social media were also used) and specified they used NLP techniques to analyze these data.</p>
        <p>Our focus was on studies that applied quantitative techniques to textual data. NLP can use a variety of different methods, including rule-based methods (eg, linguistic rules, deployment of lexicons, and development of bespoke regular expressions) and machine learning–based methods (eg, supervised classification and sequence labeling–based methods and unsupervised methods). Therefore, studies that used manual annotation were only included if they also applied quantitative methods to analyze the textual data.</p>
        <p>Two researchers screened papers considering the title and abstract. If opioid use was not stated but the authors investigated substance use (eg, “...we evaluated attitudes of people who use substances<italic>...</italic>”), we included the papers for the second round of screening. If the methodology indicated any attempt to use NLP in any step of the study or if the authors were not specific about using only qualitative techniques (eg, “...we manually classified a set of posts<italic>...</italic>”), we included the paper. Finally, if the paper did not mention Reddit but was not specific about using another social media platform, we included it (eg, papers saying “...we evaluated Twitter data...” were excluded, whereas papers stating “...we used social media discussions to understand...” were included). The full-text review excluded the following: (1) review papers (to avoid double-counting); (2) papers solely using qualitative techniques or approaching substance use in general without any particular (or stratified) analysis for opioid-related information; and (3) papers not using Reddit as the data source. AA and TP independently screened for the title, abstract, and full paper. In both stages, when AA and TP diverged in their opinions about the papers’ eligibility, AB (a third reviewer blinded to their classification) decided on eligibility as a tiebreaker. Each reviewer was responsible for the data extraction of critical outcomes of interest.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>We systematically extracted the following information: study’s year of publication; first author’s country of affiliation; authors’ areas of expertise; social media platforms investigated (in addition to Reddit); subreddit investigated; period under analysis; types of posts analyzed; number of posts analyzed; number of Reddit users represented; whether the analysis was limited to opioids and whether it distinguished between different types of opioids to infer the scope of the population investigated; whether the study attempted to have a geographic focus; whether the study described their semantic analysis to identify opioid-related terms and whether they provided a synset; study’s overarching goal, objectives, main findings, limitations, NLP methods and software used; and ethical approval information.</p>
        <p>We followed the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews) [<xref ref-type="bibr" rid="ref31">31</xref>] guidelines to ensure methodological quality and clarity of the findings. The detailed PRISMA-ScR checklist describing the 20 essential and 2 optional reporting items is presented in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
      </sec>
      <sec>
        <title>Semantic Analysis and “Opioid Synset” Development</title>
        <p>To help further studies more efficiently address opioid-related research questions using social media data, we identified the different strategies used to carry out semantic analyses of opioid-related content, compiled their lists of opioid-related terms (produced either by automatic variant generator tools or by word embedding) or similar words, and curated their content, creating a refined version where the terms are aggregated by abbreviation, misspelling, variants and their misspellings, brand names and their misspellings, slang, analogues, and mixed substances.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Selection of Sources of Evidence</title>
        <p>The literature search returned 233 papers, of which 64 (27.4%) were duplicates, 128 (54.9%) were considered ineligible and were thus removed after the title and abstract screening, and 11 (4.7%) were similarly removed after the full-text screening, resulting in a final list of 30 papers. <xref rid="figure1" ref-type="fig">Figure 1</xref> displays the search process, following PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines [<xref ref-type="bibr" rid="ref32">32</xref>]. A table with a summary of all study findings is provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. Graphs illustrate the main results to give an overview of the literature studied.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Diagram of the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses)–oriented review process. ACM: Association for Computing Machinery; NLP: natural language processing. Note: Under “Studies included in Review,” some of the papers were available on more than one database.</p>
          </caption>
          <graphic xlink:href="infodemiology_v4i1e51156_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Studies’ Characteristics</title>
        <p>As detailed in <xref ref-type="table" rid="table1">Table 1</xref>, the number of studies applying NLP methods to data from Reddit forums to study opioid use has increased over time. Over half of the studies (19/30, 64%) were published in peer-reviewed journals, over a third (10/30, 33%) were published in conference proceedings, and 1 (3%) was published as a chapter in a book. Most studies (28/30, 93%) were disseminated in platforms with subject areas in computer science and health. Half of the studies (16/30, 53%) were exclusively concerned with opioids and OUD, while the remaining studies (14/30, 47%) were broader in scope (eg, substance use). However, content relating to other substances was sometimes referenced in the studies focused on opioids. For instance, the study by Preiss et al [<xref ref-type="bibr" rid="ref33">33</xref>] identified a broader range of substances used for self-medication among people experiencing opioid withdrawal symptoms.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of characteristics of studies using natural language processing methods to investigate opioid use (N=30).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="470"/>
            <col width="0"/>
            <col width="470"/>
            <thead>
              <tr valign="top">
                <td colspan="4">Study characteristics</td>
                <td>Studies, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Year of publication</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">2017</td>
                <td>1 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">2018</td>
                <td>1 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">2019</td>
                <td>5 (17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">2020</td>
                <td>6 (20)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">2021</td>
                <td>5 (17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">2022</td>
                <td>12 (40)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Dissemination platform</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Peer-reviewed journal</td>
                <td>19 (64)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Conference proceedings</td>
                <td>10 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Book chapter</td>
                <td>1 (3)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Subject area of the dissemination platform</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Computer science</td>
                <td>10 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Health and medicine</td>
                <td>8 (27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Both computer science and health and medicine</td>
                <td>10 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Other</td>
                <td>2 (7)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Range of substances considered</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Limited to opioids</td>
                <td>16 (53)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Distinction between different opioid types</td>
                <td>11 (37)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Software used for analysis<sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Not reported</td>
                <td>6 (20)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Python</bold>
                </td>
                <td>20 (66)</td>
              </tr>
              <tr valign="top">
                <td>
                </td>
                <td>
                  <break/>
                </td>
                <td>The Python Reddit API Wrapper</td>
                <td colspan="2">11 (37)</td>
              </tr>
              <tr valign="top">
                <td>
                </td>
                <td>
                  <break/>
                </td>
                <td>Gensim</td>
                <td colspan="2">4 (13)</td>
              </tr>
              <tr valign="top">
                <td>
                </td>
                <td>
                  <break/>
                </td>
                <td>spaCy</td>
                <td colspan="2">3 (10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Linguistic Inquiry and Word Count</td>
                <td>2 (7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">R</td>
                <td>2 (7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">IBM Watson Natural Language Understanding</td>
                <td>1 (3)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Reported sources of research funding<sup>b</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Financial support not reported</td>
                <td>8 (27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">National Science Foundation</td>
                <td>7 (23)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">National Institute on Drug Abuse</td>
                <td>5 (17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Other (eg, institute-specific funding)</td>
                <td>4 (13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Other institutes within the National Institutes of Health</td>
                <td>4 (13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Centers for Disease Control and Prevention</td>
                <td>3 (10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">No funding associated with the study</td>
                <td>2 (7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Natural Sciences and Engineering Research Council of Canada Discovery Grant</td>
                <td>1 (3)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Some studies used multiple software packages.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Some studies had multiple research grants.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Over a third (11/30, 37%) of the reviewed studies explicitly referred to specific opioid types in the research methodology. The content under analysis varied as some studies focused on specific elements of posts, such as the title, the first submission, or the comments, with most of the papers that explained the unit of analysis using a combination of the first submission and comments (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). Python was the most common programming language used to analyze posting content, although alternative analysis methods and languages were also reported, including R, IBM Watson’s Natural Language Understanding application, and Linguistic Inquiry and Word Count software.</p>
        <p>In total, 8 (N=30, 27%) studies did not report any sources of funding and another 2 (7%) studies reported that there was no funding associated with the research. Among the remaining studies, the most common source of funding was the National Science Foundation (7/30, 23% of studies) followed by the National Institute on Drug Abuse (5/30, 17% of studies). Furthermore, 5 sponsored grants were found to have supported multiple studies in the review. <xref ref-type="table" rid="table2">Table 2</xref> describes the authors from studies identified in the review, almost all (99/104, 95%) of whom were based in North America. The most common field of education among the authors, based on their terminal degree, was computer science (43/104, 41%). The studies analyzed more than 20 subreddits, most of which covered specific drugs and treatments, such as r/methadone and r/suboxone. However, the rooms with a broader scope and higher number of redditors, such as r/opiates and r/opiatesrecovery, were more frequently used as data sources, in 19 (63%) and 18 (60%) studies, respectively (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary of researcher characteristics authoring studies using natural language processing methods to investigate opioid use (N=104).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="500"/>
            <col width="0"/>
            <col width="470"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Researcher characteristics</td>
                <td>Researchers, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Number of studies per researcher</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td colspan="2">90 (86.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td colspan="2">9 (8.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td colspan="2">5 (4.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Location</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>United States</td>
                <td colspan="2">92 (88.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Canada</td>
                <td colspan="2">7 (6.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Italy</td>
                <td colspan="2">4 (3.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Multiple locations (Australia and the United States)</td>
                <td colspan="2">1 (0.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Area of expertise (based on terminal degree)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Computer science</td>
                <td colspan="2">43 (41.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medicine</td>
                <td colspan="2">12 (11.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Health-related (eg, public health)</td>
                <td colspan="2">11 (10.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unclear</td>
                <td colspan="2">8 (7.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Data science or analytics or machine learning</td>
                <td colspan="2">5 (4.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Multidisciplinary</td>
                <td colspan="2">5 (4.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Psychology</td>
                <td colspan="2">5 (4.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Engineering</td>
                <td colspan="2">5 (4.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mathematics and statistics</td>
                <td colspan="2">3 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physics</td>
                <td colspan="2">2 (1.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Biology</td>
                <td colspan="2">1 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Chemistry</td>
                <td colspan="2">1 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Linguistics</td>
                <td colspan="2">1 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sociology</td>
                <td colspan="2">1 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Social work</td>
                <td colspan="2">1 (0.9)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Overarching Goal, Methods Used, and Main Findings</title>
        <p>To broadly characterize opioid-related research using Reddit data, we classified the studies according to their overarching goal. We divided them into four groups based on their contribution to the field: (1) methodological, (2) infodemiology, (3) infoveillance, and (4) pharmacovigilance. Methodological papers proposed novel NLP methods to analyze Reddit data or provide scientific tools. They apply these methods or tools to opioid use as an illustrative example but are not focused on this public health problem. Infodemiology, as defined by Eysenbach [<xref ref-type="bibr" rid="ref34">34</xref>], is a science analogous to traditional epidemiology but with information coming from electronic media and with the ultimate goal of informing public health actions. Infoveillance papers contemplate the “longitudinal tracking of infodemiology metrics for surveillance and trend analysis” [<xref ref-type="bibr" rid="ref35">35</xref>]. Pharmacovigilance covers the detection of new drugs and the surveillance of drugs and their adverse effects [<xref ref-type="bibr" rid="ref36">36</xref>]. The papers’ classification followed the procedures adopted in the study’s screening process: AA and TP independently classified the papers according to their overarching goal, and any divergence was discussed and resolved by AB as a tiebreaker.</p>
        <p>The number of studies published each year by overarching goals is presented in <xref rid="figure2" ref-type="fig">Figure 2</xref>, where we can see the increased volume and diversity of overarching goals over time. Studies could address more than one overarching goal; therefore, the cumulative number of studies represented is higher than the total number of studies included in the review.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Number of studies investigating opioid use per year using Reddit data and studies’ overarching goals (each study could address more than 1 overarching goal).</p>
          </caption>
          <graphic xlink:href="infodemiology_v4i1e51156_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Methodological Studies</title>
        <p>In total, 6 (20%) studies were classified as methodological studies. Adams et al [<xref ref-type="bibr" rid="ref37">37</xref>] compared Reddit and Twitter as sources of social media information relevant to opioid use and to improve keyword synonym lists for drug-term exploration using embedding techniques. They found that Reddit is better than Twitter as a source for discovering synonyms to be included in a keyword filter list for opioids. Akioyamen et al [<xref ref-type="bibr" rid="ref38">38</xref>] provided ways for users to navigate Reddit posts to find the content of their interest using topic modeling and showed that text mining could play a fundamental role in supporting the identification of similar documents. Davis et al [<xref ref-type="bibr" rid="ref39">39</xref>] proposed an archetype-based modeling and search method to identify messages from people who use opioids through learning from their usual vocabulary, which solicits documents from a user and finds similar documents posted by new authors based on the vocabulary. Jha and Singh [<xref ref-type="bibr" rid="ref40">40</xref>] used a set of NLP techniques, including topic modeling, sentiment analysis, and propensity score matching to extract, treat, and analyze social media textual data on legal and illegal drugs to make it available to the academic community through a web application called SMARTS. Wright et al [<xref ref-type="bibr" rid="ref19">19</xref>] developed new measures to detect changes in words’ meaning and their association with overdose by applying word embedding and neural network techniques and found that the semantic proximity of fentanyl moved more closely to overdose and overdose-related terms over time. Zhu and Bhat [<xref ref-type="bibr" rid="ref41">41</xref>] proposed a novel method to identify euphemisms or nicknames for drugs using single and multiwords embedding techniques. The new approach, known as euphemistic phrase detection, was reported to have higher detection accuracies compared to alternative methods.</p>
      </sec>
      <sec>
        <title>Infodemiology Studies</title>
        <p>Of the 22 studies classified as infodemiology, 7 (31%) explored associations: Andy [<xref ref-type="bibr" rid="ref42">42</xref>] investigated correlations between different types of self-disclosures (positive and negative) and social support seeking (emotional and informational). The results showed that correlations between positive self-disclosure and emotional support seeking were moderate to strong, while those between negative self-disclosure and informational support seeking were low to moderate. Balsamo et al [<xref ref-type="bibr" rid="ref43">43</xref>] estimated the odds ratio between opioid use and (1) routes of administration and (2) drug-tampering methods and routes of administration and drug-tampering procedures. Their findings suggest that substances were consumed in multiple, nonexclusive ways. Jha and Singh [<xref ref-type="bibr" rid="ref44">44</xref>] explored associations between various latent constructs, addiction recovery, and relapse (defined as posted by users in drug addiction recovery [DAR] forums). Latent constructs capturing emotional distress, physical pain, self-development activities, and social relationships were all significantly associated with addiction recovery (ie, if a user posted in a DAR subreddit). Latent constructs capturing social activities and physical exercise were significantly associated with addiction relapse (ie, if a user posted in a recreational drug use subreddit after posting in a DAR subreddit).</p>
        <p>Spadaro et al [<xref ref-type="bibr" rid="ref45">45</xref>] explored associations between buprenorphine induction, fentanyl use, and precipitated opioid withdrawal. The paper found a relationship between increased mentions of fentanyl and its analogues with (1) increased mentions of precipitated opioid withdrawal and (2) increased mentions of the Bernese method (a microdosing strategy for buprenorphine induction). Pandrekar et al [<xref ref-type="bibr" rid="ref46">46</xref>] evaluated the association between posts of social support (measured by the number of comments and the difference between upvotes and downvotes received) and the attributes of those posts, including the use of specific terms, the semantic categories observed, and posts’ length. These analyses suggested that posts on personal issues like family, death, and home are positively associated with increased social support. Pandrekar et al [<xref ref-type="bibr" rid="ref46">46</xref>] also explored the differences between posts from anonymous and nonanonymous users, with the former being more likely to discuss negative emotions like anxiety and sadness and containing words related to health and risk. Andy and Guntuku [<xref ref-type="bibr" rid="ref47">47</xref>] explored the relationship between social support and the number of comments received using a mix of topic modeling and sentiment and correlation analysis. Their results showed that the average number of comments received was (1) positively associated with emotional support seeking and (2) negatively associated with information support seeking. Finally, Alambo et al [<xref ref-type="bibr" rid="ref48">48</xref>] explored topical correlations between postings on substance use disorders and COVID-19 between May 2020 and Sep 2020. The results showed that these correlations fluctuated over time.</p>
        <p>In total, 4 (18%) studies used discovery techniques to unveil patterns in the data. Ramachandran et al [<xref ref-type="bibr" rid="ref49">49</xref>] used sentiment analysis and ANOVA to explore the public perceptions of the opioid epidemic. The results showed an overall negative sentiment with slight variation in emotional tones across different subreddits. Gauthier et al [<xref ref-type="bibr" rid="ref50">50</xref>] tried to understand how Reddit communities support recovery using a topic-guided thematic analysis. The findings showed that community members often raised concerns about sensitive issues, such as withdrawal symptoms, body weight, legal troubles, and personal finances, and they encouraged others to seek help and navigate 12-step programs. Chen et al [<xref ref-type="bibr" rid="ref51">51</xref>] used topic modeling to explore stigma-related experiences associated with substance use. This study found topics related to negative feelings, the challenges of coping with withdrawal symptoms, dealing with others during the recovery process, and dealing with chronic pain. Graves et al [<xref ref-type="bibr" rid="ref52">52</xref>] used manual annotation and lexical similarity filter to yield information about firsthand experiences with buprenorphine-naloxone. They showed that the most frequently discussed topics included advice on the use of buprenorphine-naloxone as pharmacological treatment for OUD, information and guidance on dosage, information about tapering of dosage, its side effects and withdrawal information, and specific questions about use.</p>
        <p>In total, 11 (50%) infodemiology studies targeted the prediction or classification of people along the OUD continuum. A common theme in these studies was the prediction of redditors’ transitions between drug use, help seeking, and recovery stages. Furthermore, 2 (18%) studies developed models to predict whether redditors would post in a recovery subreddit based on their nonrecovery subreddit activities [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]. Another 2 (18%) studies developed models to predict relapse, albeit in different ways. Jha et al [<xref ref-type="bibr" rid="ref55">55</xref>] predicted the likelihood of changes in the content of users’ posts indicative of relapse. Yang et al [<xref ref-type="bibr" rid="ref56">56</xref>] predicted substance use relapse in the following week using manually labeled data to identify instances where redditors self-reported experiencing a relapse. Relapse prediction was based on emotions detected in redditors’ previous posting activities.</p>
        <p>Among the remaining prediction or classification studies, 4 (36%) assessed the predictive performance of classification models for sorting Reddit content into groups. Davis et al [<xref ref-type="bibr" rid="ref39">39</xref>] compared various classification models to predict whether redditors’ posts indicated opioid use and found that the linear support vector machine model yielded the best performance. Yao et al [<xref ref-type="bibr" rid="ref57">57</xref>] developed 2 sets of classifiers aiming to extract suicide risk posts from an opioid use context and extract opioid addiction posts from a suicidal ideation context. The former analysis yielded results showing (1) prediction accuracy and optimal model specification of classifiers varying with the percentage of suicide risk labels and (2) classifiers with better accuracy compared to those extracting opioid addiction posts from a suicidal ideation context. Chancellor et al [<xref ref-type="bibr" rid="ref58">58</xref>] developed a classification model to determine whether a post was about OUD recovery. Another study [<xref ref-type="bibr" rid="ref59">59</xref>] presented two classifiers that (1) sorted redditors into OUD and non-OUD groups according to their posting content and (2) determined whether those in the OUD group exhibited evidence of being in a positive recovery process. ElSherief et al [<xref ref-type="bibr" rid="ref60">60</xref>] developed a classifier to identify posts related to a common myth that using MOUD is simply replacing one drug with another, which may discourage people from seeking this evidence-based treatment.</p>
        <p>A study by Andy [<xref ref-type="bibr" rid="ref42">42</xref>] assessed the predictive performance of models developed to measure the degree of positive and negative self-disclosure of post titles. The model outputs were compared to annotator ratings. Another study by Andy and Guntuku [<xref ref-type="bibr" rid="ref47">47</xref>] compared the predictive performance of random forest models developed to measure the degree of social and informational support seeking expressed in post titles. They showed that the type of social support in post titles varies according to the substance use recovery forum.</p>
      </sec>
      <sec>
        <title>Infoveillance Studies</title>
        <p>In total, 7 (23%) papers were classified as an infoveillance study. Alambo et al [<xref ref-type="bibr" rid="ref48">48</xref>] estimated the longitudinal topical correlation between substance use or mental health and COVID-19–related posts through the COVID-19 pandemic, finding that this correlation peaked after August 2020. Balsamo et al [<xref ref-type="bibr" rid="ref43">43</xref>] traced the temporal evolution of posts from 2014 to 2018 relating to nonmedical consumption patterns, administration routes, and drug tampering. Their findings showed that mentions of heroin and hydrocodone decreased over time, mentions of buprenorphine and oxycodone remained relatively static, and mentions of fentanyl and codeine increased. El-Bassel et al [<xref ref-type="bibr" rid="ref22">22</xref>] explored the COVID-19 period, from March to May 2020, and revealed the topics discussed in opioid-related subreddits and how they changed over time. There was a decrease in conversation on the topic referred to as “supply shutdown,” gradual reductions in discussions on MOUD experiences and access issues, and increases in conversations on the negative consequences of OUD. Sarker et al [<xref ref-type="bibr" rid="ref61">61</xref>] used the lexical variant generation model to examine stimulant co-mention trends among people who use opioids and people using MOUD and found that the number and proportion of redditors mentioning both increased steadily over time.</p>
        <p>Pandrekar et al [<xref ref-type="bibr" rid="ref46">46</xref>] analyzed the main psychological categories (ie, relativity, cognitive processes, social words, drives, affect words, biological processes, percept, and informal speech) of the posts from the r/opiates subreddit between 2014 and 2017 and showed that posts on personal issues tend to receive more social support. Sarker et al [<xref ref-type="bibr" rid="ref23">23</xref>] compared pre– and post–COVID-19 monthly discussions on drug use, treatment access, care, and withdrawal. The results showed an increase in posts discussing withdrawal, treatment, and access to care from pre– to post–COVID-19 periods. Finally, a study by Sumner et al [<xref ref-type="bibr" rid="ref62">62</xref>] used a time series regression with the least absolute shrinkage and selection operator approach to predict opioid overdose deaths (from CDC WONDER), using Twitter and Reddit post volume as predictor variables.</p>
      </sec>
      <sec>
        <title>Pharmacovigilance Studies</title>
        <p>In total, 3 (10%) studies were classified as a pharmacovigilance study. Chancellor et al [<xref ref-type="bibr" rid="ref58">58</xref>] identified alternative drugs for treating OUD using word embeddings. The top 5 most frequently observed potential treatments were kratom, loperamide, Xanax, Valium, and Klonopin. Preiss et al [<xref ref-type="bibr" rid="ref33">33</xref>] aimed to find medications to cope with opioid withdrawal symptoms based on observed correlations between text entities identified within posts relating to withdrawal symptoms and substances. Besides the ones already approved by the Food and Drug Administration or commonly used to treat symptoms, they found additional medicines considered potentially helpful (eg, gabapentin for body aches) and natural or home remedies (eg, ginger for nausea). Wright et al [<xref ref-type="bibr" rid="ref19">19</xref>] evaluated the semantic proximity of individual substances to “overdose” through the years, with fentanyl being found to experience the most significant changes as it moved more closely to overdose and overdose-related terms.</p>
        <p><xref ref-type="table" rid="table3">Table 3</xref> presents the selected studies, their overarching goal, the research question they address, and the NLP methods used. This can serve as a guide to help researchers studying substance use in formulating research questions that could be answered by applying NLP methods to Reddit data and to identify which NLP methods (and miscellaneous methods) to use in each case. To facilitate this process among researchers studying substance use with no expertise in NLP methods, we provide a brief description of these methods alongside examples of research questions they can answer in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. Full details on the data extracted for each study during the review process are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Overarching goals, research questions, and methods for studies applying natural language processing methods to Reddit data to investigate opioid use.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="180"/>
            <col width="230"/>
            <col width="320"/>
            <col width="270"/>
            <thead>
              <tr valign="top">
                <td>Study</td>
                <td>Overarching goal</td>
                <td>Research question</td>
                <td>Methods</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Adams et al [<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>Methodological</td>
                <td>Drug term discovery</td>
                <td>Word embedding</td>
              </tr>
              <tr valign="top">
                <td>Akioyamen et al [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Methodological</td>
                <td>Combine methods to allow users to actively navigate through topics or posts of interest</td>
                <td>Topic modeling (LDA<sup>a</sup>) and sentiment analysis</td>
              </tr>
              <tr valign="top">
                <td>Jha and Singh [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>Methodological</td>
                <td>Develop a tool to analyze data from Reddit and Twitter and make it available to the academic community for use</td>
                <td>Topic modeling (LDA), sentiment analysis, and propensity score matching</td>
              </tr>
              <tr valign="top">
                <td>Zhu and Bhat [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>Methodological</td>
                <td>Produce a list of euphemistic phrase candidates that are used as substitutes for target keywords corresponding to drug names</td>
                <td>Phrase mining on a raw text corpus</td>
              </tr>
              <tr valign="top">
                <td>Davis et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>Methodological and infodemiology—prediction or classification</td>
                <td>Predict archetypes</td>
                <td>Archetype-based modeling and search</td>
              </tr>
              <tr valign="top">
                <td>Wright et al [<xref ref-type="bibr" rid="ref19">19</xref>]</td>
                <td>Methodological and pharmacovigilance</td>
                <td>Measure movements over time of the semantic proximity of substance-related terms to “overdose”</td>
                <td>Diachronic word embedding</td>
              </tr>
              <tr valign="top">
                <td>Jha and Singh [<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                <td>Infodemiology—associations</td>
                <td>Identify and quantify the relationship between emotional distress, physical pain, self-development, relationships, and geographic disparities versus drug addiction recovery and relapse</td>
                <td>Semantic-based analysis and structural equation modeling</td>
              </tr>
              <tr valign="top">
                <td>Spadaro et al [<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                <td>Infodemiology—associations</td>
                <td>Study potential associations between fentanyl, buprenorphine induction, and precipitated opioid withdrawal</td>
                <td>Annotation and term-frequency matrix</td>
              </tr>
              <tr valign="top">
                <td>Andy [<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                <td>Infodemiology-associations and infodemiology—prediction or classification</td>
                <td>Measure types of self-disclosures (ie, positive and negative) and social supports sought (ie, emotional and informational)</td>
                <td>Random forest and correlation analysis</td>
              </tr>
              <tr valign="top">
                <td>Andy and Guntuku [<xref ref-type="bibr" rid="ref47">47</xref>]</td>
                <td>Infodemiology-association and infodemiology—prediction or classification</td>
                <td>Determine the relationship between the social supports expressed in the titles of posts and the number of comments they receive</td>
                <td>Topic modeling (LDA) and sentiment analysis</td>
              </tr>
              <tr valign="top">
                <td>Alambo et al [<xref ref-type="bibr" rid="ref48">48</xref>]</td>
                <td>Infodemiology—associations and infoveillance</td>
                <td>Monitor trends of correlation between depression or substance use disorder and coronavirus posts</td>
                <td>Word embedding, topic modeling (LDA), and correlation analysis</td>
              </tr>
              <tr valign="top">
                <td>Balsamo et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                <td>Infodemiology—associations and infoveillance</td>
                <td>Characterize patterns and estimate correlations between routes of administration and drug tampering</td>
                <td>Word embedding and correlation analysis</td>
              </tr>
              <tr valign="top">
                <td>Pandrekar et al [<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                <td>Infodemiology—associations and infoveillance</td>
                <td>Understand posts’ psychological categories and examine the association between posts’ attributes and the social support received</td>
                <td>Topic modeling (LDA), semantic-based analysis, negative binomial, and Mann-Whitney U tests</td>
              </tr>
              <tr valign="top">
                <td>Ramachandran et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>Infodemiology—discovery</td>
                <td>Unveil public opinion on the opioid epidemic</td>
                <td>Sentiment analysis and ANOVA</td>
              </tr>
              <tr valign="top">
                <td>Gauthier et al [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>Infodemiology—discovery</td>
                <td>Understand how web-based communities support recovery</td>
                <td>Topic modeling (LDA) and thematic analysis</td>
              </tr>
              <tr valign="top">
                <td>Chen et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>Infodemiology—discovery</td>
                <td>Examine the nature of stigma-related experience related to substance use and the salient affective and temporal factors in the use of 3 substances (including opioids)</td>
                <td>Manual annotation and topic modeling (NMF<sup>b</sup>)</td>
              </tr>
              <tr valign="top">
                <td>Graves et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>Infodemiology—discovery</td>
                <td>Identify topics discussing firsthand experiences with buprenorphine-naloxone</td>
                <td>Manual annotation and lexical similarity filter</td>
              </tr>
              <tr valign="top">
                <td>ElSherief et al [<xref ref-type="bibr" rid="ref60">60</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Identify misinformation related to medications for opioid use disorder</td>
                <td>Bidirectional long short-term memory</td>
              </tr>
              <tr valign="top">
                <td>Eshleman et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Predict users’ propensity for seeking drug recovery interventions</td>
                <td>Word embedding and prediction or classification: K-NN<sup>c</sup>, K-NN, random forests, logistic regression, and naive Bayes.</td>
              </tr>
              <tr valign="top">
                <td>Jha et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Characterize addiction stages of opioid use from users’ social media posts</td>
                <td>Word embedding and a combination of bidirectional long short-term-memory networks and conditional random fields</td>
              </tr>
              <tr valign="top">
                <td>Lu et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Predict users’ transitions from casual drug discussion forums to drug recovery forums</td>
                <td>Word embedding, binary classifier, and Cox regression</td>
              </tr>
              <tr valign="top">
                <td>Yang et al [<xref ref-type="bibr" rid="ref59">59</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Predict relapse among people who use opioids</td>
                <td>Topic modeling (LDA), correlation analysis, sentiment analysis, and support vector machine</td>
              </tr>
              <tr valign="top">
                <td>Yang et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Predict opioid use disorder and recovery among people who use opioids</td>
                <td>Sentiment analysis, generative adversarial networks, and correlation analysis</td>
              </tr>
              <tr valign="top">
                <td>Yao et al [<xref ref-type="bibr" rid="ref57">57</xref>]</td>
                <td>Infodemiology—prediction or classification</td>
                <td>Identify posts of suicidality among people who use opioids</td>
                <td>Word embedding, convolutional neural network (also tested logistic regression, random forest, support vector machines, FastText, recurrent neural network, and attention-based bidirectional recurrent neural network)</td>
              </tr>
              <tr valign="top">
                <td>Chancellor et al [<xref ref-type="bibr" rid="ref58">58</xref>]</td>
                <td>Infodemiology—prediction or classification and pharmacovigilance</td>
                <td>Identify messages related to opioid use recovery and alternative treatments</td>
                <td>Binary transfer learning classifier and word embeddings</td>
              </tr>
              <tr valign="top">
                <td>El-Bassel et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td>
                <td>Infoveillance</td>
                <td>Identify challenges faced by people who use opioids and how these change over time</td>
                <td>Word embedding and topic modeling (LDA)</td>
              </tr>
              <tr valign="top">
                <td>Sarker et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td>
                <td>Infoveillance</td>
                <td>Identify prescription or illegal opioid use, describe opioid treatment access and care, and withdrawal</td>
                <td>Annotation and term-frequency matrix</td>
              </tr>
              <tr valign="top">
                <td>Sarker et al [<xref ref-type="bibr" rid="ref61">61</xref>]</td>
                <td>Infoveillance</td>
                <td>Examine stimulant comention trends among people who use opioids or receive medications for opioid use disorder.</td>
                <td>Generate lexical variants and negatives (LexExp<sup>d</sup> and NegEx<sup>e</sup>)</td>
              </tr>
              <tr valign="top">
                <td>Sumner et al [<xref ref-type="bibr" rid="ref62">62</xref>]</td>
                <td>Infoveillance</td>
                <td>Build a statistical model for estimating national opioid overdose deaths using multiple predictors, including data on the volume of Reddit posts mentioning heroin and synthetic opioids.</td>
                <td>Time-series analysis (LASSO<sup>f</sup>)</td>
              </tr>
              <tr valign="top">
                <td>Preiss et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>Pharmacovigilance</td>
                <td>Identify symptoms and remedies for opioid withdrawal</td>
                <td>Word embedding and named entity recognition</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>LDA: latent Dirichlet allocation.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>NMF: nonnegative matrix factorization.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>K-NN: K-nearest neighbors.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>c</sup>LexExp: unsupervised lexicon expansion system.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>d</sup>NegEx: negation detection algorithm.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>e</sup>LASSO: least absolute shrinkage and selection operator.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Scope of Substance Use Populations Considered and Distinction of Opioid Types</title>
        <p>The anonymity characteristic of Reddit data prevents any definitive description of the study participants, composed of individuals contributing and responding to the posts selected for analysis. Nonetheless, participation in subreddits implies an active personal engagement with the topic, and therefore most studies in this review presuppose that the data from posts represent the language, views, and experiences of people who use opioids. For instance, the study by Andy and Guntuku [<xref ref-type="bibr" rid="ref47">47</xref>] et al analyzed data to investigate the types of support sought by people recovering from OUD, which was assumed based on their activity in the r/OpiatesRecovery and r/suboxone subreddits. Furthermore, 4 (13%) other studies also made inferences about the drug use and recovery status of individual redditors based on the subreddits they were found to post in [<xref ref-type="bibr" rid="ref53">53</xref>-<xref ref-type="bibr" rid="ref55">55</xref>]. In total, 5 (17%) studies involved the manual inspection and labeling of a sample of posts to verify whether they were indicative of ongoing opioid use, recovery efforts, or a recent relapse [<xref ref-type="bibr" rid="ref55">55</xref>-<xref ref-type="bibr" rid="ref59">59</xref>]. Similarly, a study by Graves et al [<xref ref-type="bibr" rid="ref52">52</xref>] involved a manual thematic categorization of 200 posts by 3 separate researchers to determine whether the posts’ contents were indicative of personal experiences of buprenorphine-naloxone use. Another study by El-Bassel et al [<xref ref-type="bibr" rid="ref22">22</xref>] was more cautious in acknowledging that their data might not reflect the firsthand experiences of people using drugs, despite this being the purpose of their study. In all 5 studies, the posts were labeled by health or substance use researchers except for 1 study, relying on nonspecialist workers from Amazon Mechanical Turk [<xref ref-type="bibr" rid="ref57">57</xref>].</p>
      </sec>
      <sec>
        <title>Limitations Mentioned by the Authors</title>
        <p>In total, 20 (67%) studies reported limitations associated with the methods used or the results produced. The most commonly cited limitation was the uncertainty regarding the representativeness of the community of people discussing opioid use on Reddit to the broader population of people who use opioids [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref62">62</xref>]. A related set of limitations was the lack of information on the demographics and location of the study participants [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref50">50</xref>] and the inability to ascertain whether study participants had a clinical diagnosis of OUD [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]. Another limitation was the presumption that subreddits dedicated to opioid use and recovery would consistently provide relevant content. A manual review undertaken in the study by Yao et al [<xref ref-type="bibr" rid="ref57">57</xref>] showed that this was not true in many instances. Another study acknowledged that relying on thematic subreddits addressing substance use disorders disregards relevant content in nondrug use subreddits [<xref ref-type="bibr" rid="ref54">54</xref>].</p>
      </sec>
      <sec>
        <title>Semantic Analysis and “Opioid Synset” Development</title>
        <p>As Reddit forums are internet-based spaces used by people looking for information, advice, or simply to share experiences, the textual variation by colloquial terms (slang), misspellings, and abbreviations is frequent. This heterogeneity imposes a challenge for NLP methods.</p>
        <p>More recent studies have used NLP tools for automatic variant generation [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]. Some studies have used existing lists of slang terms derived from the Drug Enforcement Administration Drug Slang Code Words [<xref ref-type="bibr" rid="ref63">63</xref>], the Drug Abuse Ontology [<xref ref-type="bibr" rid="ref64">64</xref>], and the Urban Dictionary [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref65">65</xref>]. However, many of the papers have explored the potentialities of embedding words to deal with semantic variation. While some studies incorporated word embedding methods into the analysis [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref53">53</xref>-<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref57">57</xref>], others used this methodology with the ultimate (or intermediate) goal of expanding opioid-related vocabulary [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. In this spirit, Zhu and Bhat [<xref ref-type="bibr" rid="ref41">41</xref>] proposed a multiword method to identify nonsingle word euphemisms for the drug use field.</p>
        <p>Despite the accessibility of word embeddings for document identification, it is important to emphasize that the outputs require expert curation to ensure precision in the meaning of the words used. This is because word embedding outcomes do not provide synonyms but words with similar representations. For example, in the study of Chancellor et al [<xref ref-type="bibr" rid="ref58">58</xref>], word embedding outcomes for fentanyl included morphine, heroin, or even ketamine. We systematically categorized opioid-related terms used and generated across selected studies to produce a comprehensive “opioid synset” and support research in this area (<xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>).</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>Ethics approval was reported for 2 (7%) of the studies [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref52">52</xref>], while a further 4 (13%) studies were granted exemptions from ethics reviews [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref62">62</xref>]. The studies’ dissemination vehicle did not seem to determine whether they included ethical considerations. About 45% (5/11) of the conference proceedings and books and 63% (12/19) of the peer-reviewed papers did not report obtaining ethical clearance or any type of action to protect participants. From the remaining 55% (6/11) of the conference proceedings and books, 2 (33%) submitted their projects to the Institutional review board (IRB) and had them approved or exempted, 2 (33%) used strategies to protect participants, such as paraphrasing, and 2 (33%) argued the studies did not qualify for the ethics board review. Of the 37% (7/19) of the peer-reviewed papers that reported some ethical considerations to protect participants’ privacy, 4 (57%) submitted their projects to the IRB and had them approved or exempted, and 3 (43%) argued the studies did not qualify for ethics board review. The papers’ ethical considerations are available in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Contributions and Potential of This Research</title>
        <p>This paper describes the small but growing body of research applying NLP methods to analyze content from Reddit relating to opioid use. We show that the existing literature is diverse in scope, as indicated by the combination of infodemiology, infoveillance, pharmacovigilance, and methodological studies’ overarching goals. The literature is also varied in terms of NLP methods used, which include word expansion techniques, topic models, and prediction or classification methods. We found that most studies have been led by researchers with training in computer science, which was also the leading subject area associated with the platforms used for their dissemination or publication. This trend might explain the high degree of emphasis placed on the conduct of methods-driven research in the literature that demonstrates the application of NLP methods in the context of OUD, as opposed to research being primarily motivated by a theory or hypotheses specific to OUD. Indeed, while some studies showcase NLP applications to Reddit data that could directly be used toward routine public health surveillance or interventions in the context of OUD, many studies presented NLP methodological development and used OUD as an opportune case study without considering their practical use or operationalization.</p>
        <p>Given our focus on leveraging big data and NLP methods to improve public health responses to the opioid crisis, we provide an overview of the key contributions that have been and could be achieved through further engagement with this research. Reddit has been increasingly used as a source of information to understand opioid use behaviors and their connections with other conditions. Significant problems inherent to the substance use field, including the identification and classification of participants’ membership along the OUD continuum and the longitudinal tracking of OUD-related metrics, have been robustly explored in studies, such as Jha et al [<xref ref-type="bibr" rid="ref55">55</xref>] and Alambo et al [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        <p>Compared to traditional qualitative studies that rely on recruiting and interviewing participants, studies using Reddit data provide temporal flexibility, enabling the retrospective investigation of particular periods of interest, bypassing recall bias, as well as longitudinal perspectives (which are rare in the context of qualitative studies actively engaging participants). The latter can include following redditor cohorts (ie, following the same individuals over time) [<xref ref-type="bibr" rid="ref53">53</xref>] or specific topics (including a mix of old and new redditors participating in that specific subreddit at each time point) [<xref ref-type="bibr" rid="ref23">23</xref>]. Indeed, the studies using Reddit data use Reddit data opportunistically, while traditional qualitative studies that actively engage participants are designed to answer specific research questions. Compared to studies using traditional qualitative methods to analyze Reddit data, we found that those studies using NLP methods identified similar topics. We identified 3 studies using qualitative thematic analysis on posts of the subreddits r/Opiates and r/OpiatesRecovery, during the peak months of the COVID-19 pandemic, March to May 2020 [<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>], which could be compared with the NLP-based study included in this scoping review using data from March to May 2020, from the subreddits r/opiates, r/OpiatesRecovery, r/suboxone, and r/Methadone [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
        <p>The qualitative study conducted by Krawczyk et al [<xref ref-type="bibr" rid="ref68">68</xref>], which explored the impact of changes imposed by the pandemic on OUD treatment access, found that people who use opioids were concerned about OUD treatment facilities’ closure, the transition to telehealth, inconsistency between methadone daily clinic requirements and exposure to COVID-19 risks, impressions on regulation changes for MOUD, and how the pandemic was impacting treatment motivation and progress. Bunting et al [<xref ref-type="bibr" rid="ref67">67</xref>] also qualitatively explored COVID-19 restrictions’ consequences on the daily lives of people who use opioids, such as social isolation and the consequent change in the social network, and how Reddit was used to ask for or offer advice. Finally, Arshonsky et al [<xref ref-type="bibr" rid="ref66">66</xref>] described psychological and behavioral coping strategies for withdrawal symptoms and cessation or reduction of opioid use.</p>
        <p>Comparatively, the paper by El-Bassel et al [<xref ref-type="bibr" rid="ref22">22</xref>] on NLP provided an overview of the main topics representing different concerns around OUD in the context of COVID-19 and its trend and changes as the pandemic evolved. It found similar access issues during the COVID-19 months, such as closed and overcrowded treatment centers, limited take-home doses, switching from methadone to buprenorphine treatment to avoid daily clinic visits, or switching from oral to injectable buprenorphine to avoid access barriers, financial barriers to access MOUD, helpfulness of telehealth, withdrawal issues originated by diminished drug supply and MOUD facilities’ closures, confusion if their symptoms were because of withdrawal or COVID-19 infection, stigmatization by health care providers, self-medication to keep in the recovery track, and home detox. Sarker et al [<xref ref-type="bibr" rid="ref23">23</xref>] also found similar topics during the COVID-19 pandemic to those reported by El-Bassel et al [<xref ref-type="bibr" rid="ref22">22</xref>] and by the 3 qualitative studies mentioned [<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>], with the bonus of following the relative frequency of themes associated with drug use, treatment and access, and withdrawal over time (ie, infoveillance). This suggests NLP methods can effectively identify key themes while saving time and covering larger textual corpora. A study purposefully designed to compare NLP versus traditional qualitative methods is needed to rigorously investigate the advantages and drawbacks of NLP methods.</p>
        <p>Given the complexity of the research questions, in general, researchers used a mix of NLP methods to address opioid-related problems. Traditional NLP methods, such as topic modeling, were used more frequently to discover aspects of opioid use behavior and follow them over time (infodemiology and infoveillance papers), whereas word embedding was often used to discover new drugs (pharmacovigilance) and in tandem with classification and prediction methods to detect people’s stage in the OUD continuum (infodemiology). In contrast, sentiment analysis was mostly used to infer redditor’s opinions and positioning about opioid use. Another important aspect of the studies analyzed in this scoping review is its implications for public health responses. While none of the studies described the implementation of Reddit-based interventions, several studies have the potential to be used toward such purposes. For example, the study by ElSherief et al [<xref ref-type="bibr" rid="ref60">60</xref>] aimed to identify misinformation related to MOUD. It is natural to foresee how such a tool could be used on a routine basis to detect existing and new myths, and both respond to those posts providing evidence-based information as well as to compile these myths to guide public health messaging by providers and relevant agencies. Studies presenting methods to identify users at high risk of relapse [<xref ref-type="bibr" rid="ref55">55</xref>] or suicide [<xref ref-type="bibr" rid="ref57">57</xref>] could also be used to reach out to these individuals with helpful resources, including crisis lines and other types of support, as has been done in other studies [<xref ref-type="bibr" rid="ref69">69</xref>-<xref ref-type="bibr" rid="ref71">71</xref>]. Similarly, those identified as having a high probability of transitioning to an opioid recovery subreddit could benefit from information and resources to engage in treatment, counseling, support groups, or activities to facilitate this process [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
      </sec>
      <sec>
        <title>Methodological Remarks and Recommendations</title>
        <p>The NLP methods used by the selected studies were diverse. We provided a map to identify appropriate methods depending on the research problem addressed. In addition, we have endeavored to bring clarity regarding the different types of data used in the studies. The commonly used term <italic>post</italic>, used across many studies is not specific enough as it does not fully characterize the data considered (first submission, comment, or whether it includes the title). Similarly, it is not always clear how many posts were included in the analyses (eg, all those available over a period versus a sample of the posts submitted) and how many different users these posts represented. Importantly, details about the subreddits considered and the period covered are not systematically specified. Best practices for Reddit or other social media platforms’ data description should include these key characteristics to improve transparency about the representativity of the data and to enable its reproducibility.</p>
        <p>We also found important variation in terms of the use of “dictionaries” to enable the identification of opioid use–related content, which can have an impact on the results through modifying the body of data examined. We, therefore, offer an important resource to increase the quality of new research on opioid use undertaken in this space through the synset we compiled and shared in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p>
        <p>Regarding the use of NLP on Reddit data, some considerations should be highlighted. Approaching Reddit data from an exploratory perspective, at least initially, is useful to ascertain the extent to which Reddit data are suitable for your particular research question. Careful selection of appropriate subreddits is important given that each subreddit has a distinct culture and associated norms. For example, the r/trees subreddit is devoted to the discussion of cannabis use, whereas the r/marijuanaenthusiasts subreddit is devoted to the discussion of arboreal matters. Reddit-based research—particularly in health-related areas—should be assessed by research ethics committees or IRBs and follow research ethics protocols related to privacy protection. For example, Benton et al [<xref ref-type="bibr" rid="ref72">72</xref>] recommend adopting policies related to privacy protection (eg, refraining from using direct quotations in presentations and publications) and—where appropriate—deidentifying data (eg, using anonymous numerical codes in the place of social media usernames).</p>
        <p>Recent changes in Reddit’s application programming interface access have the potential to affect future research that relies on real-time, high-throughput data access. However, historical data (before April 2023) remains publicly available via PushShift and the free Reddit application programming interface (accessed via PRAW in Python) can be used to collect recent posts containing specific keywords. Furthermore, it is possible to purchase data from Reddit, with the study by Poudel and Weninger [<xref ref-type="bibr" rid="ref73">73</xref>] estimating a potential cost of US $240 per 1 million posts. Finally, as of late May 2024, Reddit is planning on implementing a new service aimed at providing academic researchers with affordable data [<xref ref-type="bibr" rid="ref74">74</xref>].</p>
        <p>Given the rapid changes in NLP technology, it is difficult to predict the future directions of application of NLP methods to address substance use disorders–related research questions, particularly concerning the future performance of large language models such as Gemini and ChatGPT (OpenAI LP). However, 2 broad themes are emerging. First, a growing democratization of NLP methods, given that generative NLP methods allow for the creation of baseline NLP tools by public health experts with relatively little computer science expertise (for example, by using prompt engineering approaches). Second, potentially increasing costs associated with accessing data for research given the industry-wide drive to monetize social media data.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our findings highlight 2 fundamental paradoxes associated with NLP-based research on opioids using content from Reddit. The first paradox relates to the anonymity afforded to Reddit users to disclose their own experiences and viewpoints related to opioid use. While this anonymity is advantageous as far as it supports the availability of evidence offering unique insights compared to other sources (eg, routine household surveys), it also represents a limitation because it implies a lack of demographic and clinical information on study participants. This may cast doubts upon the authenticity of the findings as there is no way of verifying whether the content reflects firsthand experiences or whether study participants meet the clinical criteria for a diagnosis of OUD. The second paradox relates to the methodological capabilities of NLP techniques to draw inferences from user-generated textual data. These computational methods have facilitated the large-scale computation of specific tasks, such as content identification and detection of textual patterns involving huge quantities of data. Despite these advances, there appear to be limits on the types of inferences that NLP methods can make, particularly when it comes to analyses that go beyond content identification (eg, posts related to opioid use) and attempt to interpret meaning. This observation corresponds with findings elsewhere, showing that NLP methods are valuable adjuncts to traditional qualitative research methods but do not yet represent an adequate alternative to human analyses [<xref ref-type="bibr" rid="ref75">75</xref>].</p>
        <p>Despite the extensive use of bespoke lexica to perform analysis of social media text, these lexicon-based approaches remain error-prone due to ambiguities characteristic of natural language. For example, different drugs may be referred to by the same slang term in different contexts (eg, “junk” can be used to refer to either heroin or cocaine).</p>
        <p>A methodological limitation of this scoping review is the inclusion of papers exclusively written in English. Although more than half of Reddit users are from countries with the ongoing opioid epidemic and that speak predominantly English, such as the United States, United Kingdom, Canada, and Australia [<xref ref-type="bibr" rid="ref24">24</xref>], this imposes a potential constrain on the understanding of how researchers are using NLP methods in Reddit to investigate opioid use.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This comprehensive review explores the expanding application of NLP methodologies to analyze text data sourced from Reddit, with a particular focus on opioid-related subreddits. A wide variety of NLP techniques and applications can be observed in the literature that demonstrate the potential for NLP use to support surveillance and social media interventions addressing the opioid crisis. Although we found that these methods offer useful insights into the behavior and attitudes of people who use opioids, there are limits to the utility of these automated approaches, with current methods best thought of as supplementary to current, established epidemiological methods.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Joanna Briggs Institute population (or participants)/concept/context (PCC) framework rationale behind each research question.</p>
        <media xlink:href="infodemiology_v4i1e51156_app1.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Search terms strategy.</p>
        <media xlink:href="infodemiology_v4i1e51156_app2.docx" xlink:title="DOCX File , 200 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews) checklist.</p>
        <media xlink:href="infodemiology_v4i1e51156_app3.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Data extraction table.</p>
        <media xlink:href="infodemiology_v4i1e51156_app4.xls" xlink:title="XLS File  (Microsoft Excel File), 144 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Brief definitions of the natural language processing methods most used by the scoping review papers, according to Wikipedia (accessed on January 20, 2023).</p>
        <media xlink:href="infodemiology_v4i1e51156_app5.docx" xlink:title="DOCX File , 19 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Synset.</p>
        <media xlink:href="infodemiology_v4i1e51156_app6.xls" xlink:title="XLS File  (Microsoft Excel File), 42 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DAR</term>
          <def>
            <p>drug addiction recovery</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">IRB</term>
          <def>
            <p>institutional review board</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">JBI</term>
          <def>
            <p>Joanna Briggs Institute</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MOUD</term>
          <def>
            <p>medication for opioid use disorder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">OUD</term>
          <def>
            <p>opioid use disorder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PRISMA</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">PRISMA-ScR</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by the National Institute on Drug Abuse DP2 DA049295 grant (principal investigator AB). TP acknowledges funding from the T32 DA023356 grant, and MC acknowledges funding from the National Institute on Drug Abuse R21DA05668 grant.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Degenhardt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Grebely</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hickman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vickerman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Bruneau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Altice</surname>
              <given-names>Fl</given-names>
            </name>
            <name name-style="western">
              <surname>Henderson</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rahimi-Movaghar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Larney</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Global patterns of opioid use and dependence: harms to populations, interventions, and future action</article-title>
          <source>Lancet</source>
          <year>2019</year>
          <month>10</month>
          <day>26</day>
          <volume>394</volume>
          <issue>10208</issue>
          <fpage>1560</fpage>
          <lpage>79</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31657732"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(19)32229-9</pub-id>
          <pub-id pub-id-type="medline">31657732</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(19)32229-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7068135</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>UNODC world drug report 2019</article-title>
          <source>UN Office on Drugs and Crime</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://tinyurl.com/zbxdwx7k">https://tinyurl.com/zbxdwx7k</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Drug overdose death rates</article-title>
          <source>National Institute on Drug Abuse</source>
          <year>2023</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://nida.nih.gov/research-topics/trends-statistics/overdose-death-rates">https://nida.nih.gov/research-topics/trends-statistics/overdose-death-rates</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <article-title>U.S. overdose deaths in 2021 increased half as much as in 2020 – but are still up 15%</article-title>
          <source>National Center for Health Statistics</source>
          <year>2022</year>
          <access-date>2024-04-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/nchs/pressroom/nchs_press_releases/2022/202205.htm#:~:text=Provisional%20data%20from%20CDC's%20National,93%2C655%20deaths%20estimated%20in%202020">https://www.cdc.gov/nchs/pressroom/nchs_press_releases/2022/202205.htm#:~:text=Provisional%20data%20from%20CDC's%20National,93%2C655%20deaths%20estimated%20in%202020</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allem</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Dharmapuri</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>TB</given-names>
            </name>
          </person-group>
          <article-title>Characterizing JUUL-related posts on Twitter</article-title>
          <source>Drug Alcohol Depend</source>
          <year>2018</year>
          <month>09</month>
          <day>01</day>
          <volume>190</volume>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29958115"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.drugalcdep.2018.05.018</pub-id>
          <pub-id pub-id-type="medline">29958115</pub-id>
          <pub-id pub-id-type="pii">S0376-8716(18)30333-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6693487</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Giorgi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Buffone</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Ashford</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Hemmons</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Summers</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Can Twitter be used to predict county excessive alcohol consumption rates?</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <volume>13</volume>
          <issue>4</issue>
          <fpage>e0194290</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0194290"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0194290</pub-id>
          <pub-id pub-id-type="medline">29617408</pub-id>
          <pub-id pub-id-type="pii">PONE-D-17-28471</pub-id>
          <pub-id pub-id-type="pmcid">PMC5884504</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lazard</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Saffer</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wilcox</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Mackert</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Bernhardt</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>E-cigarette social media messages: a text mining analysis of marketing and consumer conversations on Twitter</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2016</year>
          <month>12</month>
          <day>12</day>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e171</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2016/2/e171/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.6551</pub-id>
          <pub-id pub-id-type="medline">27956376</pub-id>
          <pub-id pub-id-type="pii">v2i2e171</pub-id>
          <pub-id pub-id-type="pmcid">PMC5187450</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kalyanam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Klugman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kuzmenko</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Solution to detect, classify, and report illicit online marketing and sales of controlled substances via Twitter: using machine learning and web forensics to combat digital opioid access</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>04</month>
          <day>27</day>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>e10029</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/4/e10029/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10029</pub-id>
          <pub-id pub-id-type="medline">29613851</pub-id>
          <pub-id pub-id-type="pii">v20i4e10029</pub-id>
          <pub-id pub-id-type="pmcid">PMC5948414</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Kalyanam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Katsuki</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lanckriet</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Twitter-based detection of illegal online sale of prescription opioid</article-title>
          <source>Am J Public Health</source>
          <year>2017</year>
          <month>12</month>
          <volume>107</volume>
          <issue>12</issue>
          <fpage>1910</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.2105/AJPH.2017.303994</pub-id>
          <pub-id pub-id-type="medline">29048960</pub-id>
          <pub-id pub-id-type="pmcid">PMC5678375</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simpson</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Brugman</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Conners</surname>
              <given-names>TJ</given-names>
            </name>
          </person-group>
          <article-title>Detecting novel and emerging drug terms using natural language processing: a social media corpus study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2018</year>
          <month>01</month>
          <day>08</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>e2</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2018/1/e2/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.7726</pub-id>
          <pub-id pub-id-type="medline">29311050</pub-id>
          <pub-id pub-id-type="pii">v4i1e2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5838358</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>What online communities can tell us about electronic cigarettes and hookah use: a study using text mining and visualization techniques</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>09</month>
          <day>29</day>
          <volume>17</volume>
          <issue>9</issue>
          <fpage>e220</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/9/e220/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4517</pub-id>
          <pub-id pub-id-type="medline">26420469</pub-id>
          <pub-id pub-id-type="pii">v17i9e220</pub-id>
          <pub-id pub-id-type="pmcid">PMC4642380</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meacham</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ramo</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Understanding emerging forms of cannabis use through an online cannabis community: an analysis of relative post volume and subjective highness ratings</article-title>
          <source>Drug Alcohol Depend</source>
          <year>2018</year>
          <month>07</month>
          <day>01</day>
          <volume>188</volume>
          <fpage>364</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29883950"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.drugalcdep.2018.03.041</pub-id>
          <pub-id pub-id-type="medline">29883950</pub-id>
          <pub-id pub-id-type="pii">S0376-8716(18)30242-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6692176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Leischow</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>DD</given-names>
            </name>
          </person-group>
          <article-title>Identifying topics for e-cigarette user-generated contents: a case study from multiple social media platforms</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>01</month>
          <day>20</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>e24</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/1/e24/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5780</pub-id>
          <pub-id pub-id-type="medline">28108428</pub-id>
          <pub-id pub-id-type="pii">v19i1e24</pub-id>
          <pub-id pub-id-type="pmcid">PMC5291865</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cuomo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Purushothaman</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Calac</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>McMann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Estimating county-level overdose rates using opioid-related twitter data: interdisciplinary infodemiology study</article-title>
          <source>JMIR Form Res</source>
          <year>2023</year>
          <month>01</month>
          <day>25</day>
          <volume>7</volume>
          <fpage>e42162</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2023//e42162/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/42162</pub-id>
          <pub-id pub-id-type="medline">36548118</pub-id>
          <pub-id pub-id-type="pii">v7i1e42162</pub-id>
          <pub-id pub-id-type="pmcid">PMC9909516</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Hernandez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ruan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Perrone</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and natural language processing for geolocation-centric monitoring and characterization of opioid-related social media chatter</article-title>
          <source>JAMA Netw Open</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>2</volume>
          <issue>11</issue>
          <fpage>e1914672</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31693125"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2019.14672</pub-id>
          <pub-id pub-id-type="medline">31693125</pub-id>
          <pub-id pub-id-type="pii">2753983</pub-id>
          <pub-id pub-id-type="pmcid">PMC6865282</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kilgo</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Midberry</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Social media news production, emotional Facebook reactions, and the politicization of drug addiction</article-title>
          <source>Health Commun</source>
          <year>2022</year>
          <month>03</month>
          <volume>37</volume>
          <issue>3</issue>
          <fpage>375</fpage>
          <lpage>83</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/10410236.2020.1846265"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10410236.2020.1846265</pub-id>
          <pub-id pub-id-type="medline">33213217</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Potter</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Bad actors never sleep: content manipulation on Reddit</article-title>
          <source>Continuum</source>
          <year>2021</year>
          <month>09</month>
          <day>28</day>
          <volume>35</volume>
          <issue>5</issue>
          <fpage>706</fpage>
          <lpage>18</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/10304312.2021.1983254"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10304312.2021.1983254</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>Recent advances in using natural language processing to address public health research questions using social media and consumergenerated data</article-title>
          <source>Yearb Med Inform</source>
          <year>2019</year>
          <month>08</month>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>208</fpage>
          <lpage>17</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0039-1677918"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0039-1677918</pub-id>
          <pub-id pub-id-type="medline">31419834</pub-id>
          <pub-id pub-id-type="pmcid">PMC6697505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Chau</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Matthew Gladden</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sumner</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Detection of emerging drugs involved in overdose via diachronic word embeddings of substances discussed on social media</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>07</month>
          <volume>119</volume>
          <fpage>103824</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00153-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103824</pub-id>
          <pub-id pub-id-type="medline">34048933</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00153-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10901232</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Reddit claims 52 million daily users, revealing a key figure for social-media platforms</article-title>
          <source>The Wall Street journal</source>
          <year>2020</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wsj.com/articles/reddit-claims-52-million-daily-users-revealing-a-key-figure-for-social-media-platforms-11606822200">https://www.wsj.com/articles/reddit-claims-52-million-daily-users-revealing-a-key-figure-for-social-media-platforms-11606822200</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>LU</given-names>
            </name>
            <name name-style="western">
              <surname>Bie</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Social media and outbreaks of emerging infectious diseases: a systematic review of literature</article-title>
          <source>Am J Infect Control</source>
          <year>2018</year>
          <month>09</month>
          <volume>46</volume>
          <issue>9</issue>
          <fpage>962</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29628293"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ajic.2018.02.010</pub-id>
          <pub-id pub-id-type="medline">29628293</pub-id>
          <pub-id pub-id-type="pii">S0196-6553(18)30105-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7115293</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>El-Bassel</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hochstatter</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Slavin</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Muresan</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Harnessing the power of social media to understand the impact of COVID-19 on people who use drugs during lockdown and social distancing</article-title>
          <source>J Addict Med</source>
          <year>2022</year>
          <volume>16</volume>
          <issue>2</issue>
          <fpage>e123</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34145186"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ADM.0000000000000883</pub-id>
          <pub-id pub-id-type="medline">34145186</pub-id>
          <pub-id pub-id-type="pii">01271255-202204000-00029</pub-id>
          <pub-id pub-id-type="pmcid">PMC8678390</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nataraj</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Siu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Sumner</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Concerns among people who use opioids during the COVID-19 pandemic: a natural language processing analysis of social media posts</article-title>
          <source>Subst Abuse Treat Prev Policy</source>
          <year>2022</year>
          <month>03</month>
          <day>05</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://substanceabusepolicy.biomedcentral.com/articles/10.1186/s13011-022-00442-w"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13011-022-00442-w</pub-id>
          <pub-id pub-id-type="medline">35248103</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13011-022-00442-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC8897722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Reddit user and growth stats</article-title>
          <source>Backlinko</source>
          <year>2021</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://backlinko.com/reddit-users">https://backlinko.com/reddit-users</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arksey</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>O'Malley</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Scoping studies: towards a methodological framework</article-title>
          <source>Int J Soc Res Methodol</source>
          <year>2005</year>
          <month>02</month>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>19</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/1364557032000119616"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/1364557032000119616</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levac</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Colquhoun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>KK</given-names>
            </name>
          </person-group>
          <article-title>Scoping studies: advancing the methodology</article-title>
          <source>Implement Sci</source>
          <year>2010</year>
          <month>09</month>
          <day>20</day>
          <volume>5</volume>
          <fpage>69</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://implementationscience.biomedcentral.com/articles/10.1186/1748-5908-5-69"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1748-5908-5-69</pub-id>
          <pub-id pub-id-type="medline">20854677</pub-id>
          <pub-id pub-id-type="pii">1748-5908-5-69</pub-id>
          <pub-id pub-id-type="pmcid">PMC2954944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>The use of artificial intelligence methods in Reddit to investigate opioid use: a scoping review</article-title>
          <source>Open Science Framework</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://osf.io/ftqj3">https://osf.io/ftqj3</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <article-title>Prescription opioids DrugFacts</article-title>
          <source>National Institute on Drug Abuse</source>
          <year>2021</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://nida.nih.gov/publications/drugfacts/prescription-opioids">https://nida.nih.gov/publications/drugfacts/prescription-opioids</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <article-title>Effective treatments for opioid addiction</article-title>
          <source>National Institute on Drug Abuse</source>
          <year>2016</year>
          <access-date>2024-07-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://tinyurl.com/mry9kknr">https://tinyurl.com/mry9kknr</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <article-title>MeSH: artificial intelligence</article-title>
          <source>National Library of Medicine</source>
          <year>2022</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncbi.nlm.nih.gov/mesh/68001185">https://www.ncbi.nlm.nih.gov/mesh/68001185</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zarin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Colquhoun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Levac</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Horsley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weeks</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hempel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McGowan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hartling</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aldcroft</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Garritty</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lewin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Godfrey</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Macdonald</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Langlois</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Soares-Weiser</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moriarty</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tunçalp</surname>
              <given-names>Ö</given-names>
            </name>
            <name name-style="western">
              <surname>Straus</surname>
              <given-names>SE</given-names>
            </name>
          </person-group>
          <article-title>PRISMA extension for scoping reviews (PRISMA-ScR): checklist and explanation</article-title>
          <source>Ann Intern Med</source>
          <year>2018</year>
          <month>10</month>
          <day>02</day>
          <volume>169</volume>
          <issue>7</issue>
          <fpage>467</fpage>
          <lpage>73</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.acpjournals.org/doi/abs/10.7326/M18-0850?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.7326/M18-0850</pub-id>
          <pub-id pub-id-type="medline">30178033</pub-id>
          <pub-id pub-id-type="pii">2700389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Page</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>McKenzie</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Bossuyt</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Boutron</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Mulrow</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Shamseer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tetzlaff</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Glanville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grimshaw</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hróbjartsson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lalu</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Loder</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Mayo-Wilson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McGuinness</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Welch</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Whiting</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>
          <source>BMJ</source>
          <year>2021</year>
          <month>03</month>
          <day>29</day>
          <volume>372</volume>
          <fpage>n71</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=33782057"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>
          <pub-id pub-id-type="medline">33782057</pub-id>
          <pub-id pub-id-type="pmcid">PMC8005924</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Preiss</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Baumgartner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Edlund</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bobashev</surname>
              <given-names>GV</given-names>
            </name>
          </person-group>
          <article-title>Using named entity recognition to identify substances used in the self-medication of opioid withdrawal: natural language processing study of reddit data</article-title>
          <source>JMIR Form Res</source>
          <year>2022</year>
          <month>03</month>
          <day>30</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e33919</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2022/3/e33919/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/33919</pub-id>
          <pub-id pub-id-type="medline">35353047</pub-id>
          <pub-id pub-id-type="pii">v6i3e33919</pub-id>
          <pub-id pub-id-type="pmcid">PMC9008522</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the Internet</article-title>
          <source>J Med Internet Res</source>
          <year>2009</year>
          <month>03</month>
          <day>27</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>e11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2009/1/e11/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
          <pub-id pub-id-type="medline">19329408</pub-id>
          <pub-id pub-id-type="pii">v11i1e11</pub-id>
          <pub-id pub-id-type="pmcid">PMC2762766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology and infoveillance tracking online health information and cyberbehavior for public health</article-title>
          <source>Am J Prev Med</source>
          <year>2011</year>
          <month>05</month>
          <volume>40</volume>
          <issue>5 Suppl 2</issue>
          <fpage>S154</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.amepre.2011.02.006"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.amepre.2011.02.006</pub-id>
          <pub-id pub-id-type="medline">21521589</pub-id>
          <pub-id pub-id-type="pii">S0749-3797(11)00088-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <article-title>Regulation and prequalification - what is pharmacovigilance?</article-title>
          <source>World Health Organization</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/teams/regulation-prequalification/regulation-and-safety/pharmacovigilance">https://www.who.int/teams/regulation-prequalification/regulation-and-safety/pharmacovigilance</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Artigiani</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Wish</surname>
              <given-names>ED</given-names>
            </name>
          </person-group>
          <article-title>Choosing your platform for social media drug research and improving your keyword filter list</article-title>
          <source>Journal of Drug Issues</source>
          <year>2019</year>
          <month>03</month>
          <day>13</day>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>477</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/0022042619833911"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0022042619833911</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akioyamen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nicklas</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez-Arias</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A framework for intelligent navigation using latent Dirichlet allocation on reddit posts about opiates</article-title>
          <source>Proceedings of the 2020 4th International Conference on Compute and Data Analysis</source>
          <year>2020</year>
          <conf-name>ICCDA '20</conf-name>
          <conf-date>March 9-12, 2020</conf-date>
          <conf-loc>Silicon Valley, CA</conf-loc>
          <fpage>190</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1145/3388142.3388156"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3388142.3388156</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Sedig</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lizotte</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>Archetype-based modeling and search of social media</article-title>
          <source>Big Data Cogn Comput</source>
          <year>2019</year>
          <month>07</month>
          <day>24</day>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>44</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3390/bdcc3030044"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/bdcc3030044</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jha</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>SMARTS: the social media-based addiction recovery and intervention targeting server</article-title>
          <source>Bioinformatics</source>
          <year>2019</year>
          <month>10</month>
          <day>24</day>
          <fpage>1970</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1093/bioinformatics/btz800"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz800</pub-id>
          <pub-id pub-id-type="medline">31647520</pub-id>
          <pub-id pub-id-type="pii">5606710</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bhat</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Euphemistic phrase detection by masked language model</article-title>
          <source>Proceedings of the 2021 Association for Computational Linguistics</source>
          <year>2021</year>
          <conf-name>EMNLP '21</conf-name>
          <conf-date>November 7-11, 2021</conf-date>
          <conf-loc>Punta Cana, Dominican Republic</conf-loc>
          <fpage>163</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2021.findings-emnlp.16.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2021.findings-emnlp.16</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michalowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bianco</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Self-disclosure in opioid use recovery forums</article-title>
          <source>AI for Disease Surveillance and Pandemic Intelligence: Intelligent Disease Detection in Action</source>
          <year>2022</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>65</fpage>
          <lpage>74</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Balsamo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bajardi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Salomone</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schifanella</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Patterns of routes of administration and drug tampering for nonmedical opioid consumption: data mining and content analysis of Reddit discussions</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>01</month>
          <day>04</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>e21212</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://hdl.handle.net/2318/1768936"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21212</pub-id>
          <pub-id pub-id-type="medline">33393910</pub-id>
          <pub-id pub-id-type="pii">v23i1e21212</pub-id>
          <pub-id pub-id-type="pmcid">PMC7813634</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jha</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Analysis of associations between emotions and activities of drug users and their addiction recovery tendencies from social media posts using structural equation modeling</article-title>
          <source>BMC Bioinformatics</source>
          <year>2020</year>
          <month>12</month>
          <day>30</day>
          <volume>21</volume>
          <issue>Suppl 18</issue>
          <fpage>554</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-020-03893-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-020-03893-9</pub-id>
          <pub-id pub-id-type="medline">33375934</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-020-03893-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7772931</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spadaro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hogg-Bremer</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Love</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Perrone</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Reddit discussions about buprenorphine associated precipitated withdrawal in the era of fentanyl</article-title>
          <source>Clin Toxicol (Phila)</source>
          <year>2022</year>
          <month>06</month>
          <volume>60</volume>
          <issue>6</issue>
          <fpage>694</fpage>
          <lpage>701</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35119337"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/15563650.2022.2032730</pub-id>
          <pub-id pub-id-type="medline">35119337</pub-id>
          <pub-id pub-id-type="pmcid">PMC10457147</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pandrekar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gopalkrishna</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Social media based analysis of opioid epidemic using Reddit</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>867</fpage>
          <lpage>76</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30815129"/>
          </comment>
          <pub-id pub-id-type="medline">30815129</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371364</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Does social support (expressed in post titles) elicit comments in online substance use recovery forums?</article-title>
          <source>Proceedings of the 4th Workshop on Natural Language Processing and Computational Social Science</source>
          <year>2020</year>
          <conf-name>NLPCSS '20</conf-name>
          <conf-date>November 20, 2020</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <fpage>35</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.18653/v1/2020.nlpcss-1.4"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2020.nlpcss-1.4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alambo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Padhee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Thirunarayan</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 and mental health/substance use disorders on reddit:  a longitudinal study</article-title>
          <source>Proceedings of the 2021 Conference on Pattern Recognition, ICPR International Workshops and Challenges</source>
          <year>2021</year>
          <conf-name>ICPR '21</conf-name>
          <conf-date>January 10-15, 2021</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <fpage>20</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1007/978-3-030-68790-8_2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/978-3-030-68790-8_2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramachandran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ring</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Tones and themes in Reddits posts discussing the opioid epidemic</article-title>
          <source>J Addict Dis</source>
          <year>2022</year>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>552</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/10550887.2022.2049170"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10550887.2022.2049170</pub-id>
          <pub-id pub-id-type="medline">35274598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gauthier</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Costello</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>“I will not drink with you today”: a topic-guided thematic analysis of addiction recovery on Reddit</article-title>
          <source>Proceedings of the 2022 CHI Conference on Human Factors in Computing Systems</source>
          <year>2022</year>
          <conf-name>CHI '22</conf-name>
          <conf-date>April 29- May 5, 2022</conf-date>
          <conf-loc>New Orleans, LA</conf-loc>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3491102.3502076"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3491102.3502076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Johnny</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Examining stigma relating to substance use and contextual factors in social media discussions</article-title>
          <source>Drug Alcohol Depend Rep</source>
          <year>2022</year>
          <month>06</month>
          <volume>3</volume>
          <fpage>100061</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.dadr.2022.100061"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dadr.2022.100061</pub-id>
          <pub-id pub-id-type="medline">36845987</pub-id>
          <pub-id pub-id-type="pii">S2772-7246(22)00039-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC9948814</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Graves</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Perrone</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Garadi</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Love</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Hernandez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Thematic analysis of Reddit content about buprenorphine-naloxone using manual annotation and natural language processing techniques</article-title>
          <source>J Addict Med</source>
          <year>2022</year>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>454</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34864788"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ADM.0000000000000940</pub-id>
          <pub-id pub-id-type="medline">34864788</pub-id>
          <pub-id pub-id-type="pii">01271255-900000000-98966</pub-id>
          <pub-id pub-id-type="pmcid">PMC9365256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eshleman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jha</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Identifying individuals amenable to drug recovery interventions through computational analysis of addiction content in social media</article-title>
          <source>Proceedings of the 2017 IEEE International Conference on Bioinformatics and Biomedicine</source>
          <year>2017</year>
          <conf-name>BIBM '17</conf-name>
          <conf-date>November 13-6, 2017</conf-date>
          <conf-loc>Kansas City, MO</conf-loc>
          <fpage>849</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/BIBM.2017.8217766"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/bibm.2017.8217766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>51</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sridhar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pandey</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Mohler</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Investigate transitions into drug addiction through text mining of reddit data</article-title>
          <source>Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &#38; Data Mini</source>
          <year>2019</year>
          <conf-name>KDD '19</conf-name>
          <conf-date>August 4-8,2019</conf-date>
          <conf-loc>Anchorage, AK</conf-loc>
          <fpage>2367</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3292500.3330737"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3292500.3330737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jha</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>La Marca</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Identifying and characterizing opioid addiction states using social media posts</article-title>
          <source>Proceedings of the 2021 IEEE International Conference on Bioinformatics and Biomedicine</source>
          <year>2021</year>
          <conf-name>BIBM '21</conf-name>
          <conf-date>December 9-12, 2021</conf-date>
          <conf-loc>Houston, TX</conf-loc>
          <fpage>913</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/BIBM52615.2021.9669628"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/bibm52615.2021.9669628</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Opioid relapse prediction with GAN</article-title>
          <source>Proceedings of the 2019 IEEE/ACM International Conference on Advances in Social Networks Analysis and Mining</source>
          <year>2019</year>
          <conf-name>ASONAM '19</conf-name>
          <conf-date>August 27-30, 2019</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
          <fpage>560</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3341161.3342951"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3341161.3342951</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Duanmu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenthal</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Detection of suicidality among opioid users on Reddit: machine learning-based approach</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>11</month>
          <day>27</day>
          <volume>22</volume>
          <issue>11</issue>
          <fpage>e15293</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/11/e15293/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15293</pub-id>
          <pub-id pub-id-type="medline">33245287</pub-id>
          <pub-id pub-id-type="pii">v22i11e15293</pub-id>
          <pub-id pub-id-type="pmcid">PMC7732714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chancellor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nitzburg</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zampieri</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Choudhury</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Discovering alternative treatments for opioid use recovery using social media</article-title>
          <source>Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems</source>
          <year>2019</year>
          <conf-name>CHI '19</conf-name>
          <conf-date>May 4-9, 2019</conf-date>
          <conf-loc>Glasgow, UK</conf-loc>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3290605.3300354"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3290605.3300354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bradshaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hewett</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Discovering opioid use patterns from social media for relapse prevention</article-title>
          <source>Computer</source>
          <year>2022</year>
          <month>2</month>
          <volume>55</volume>
          <issue>2</issue>
          <fpage>23</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/MC.2021.3095826"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/mc.2021.3095826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>ElSherief</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sumner</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Law</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Kacha-Ochana</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shieber</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cordier</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Holton</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Characterizing and identifying the prevalence of web-based misinformation relating to medication for opioid use disorder: machine learning approach</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>12</month>
          <day>22</day>
          <volume>23</volume>
          <issue>12</issue>
          <fpage>e30753</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/12/e30753/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30753</pub-id>
          <pub-id pub-id-type="medline">34941555</pub-id>
          <pub-id pub-id-type="pii">v23i12e30753</pub-id>
          <pub-id pub-id-type="pmcid">PMC8734931</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Garadi</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nataraj</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Sumner</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Signals of increasing co-use of stimulants and opioids from online drug forum data</article-title>
          <source>Harm Reduct J</source>
          <year>2022</year>
          <month>05</month>
          <day>25</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>51</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://harmreductionjournal.biomedcentral.com/articles/10.1186/s12954-022-00628-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12954-022-00628-2</pub-id>
          <pub-id pub-id-type="medline">35614501</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12954-022-00628-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC9131693</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sumner</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Bowen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Holland</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zwald</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vivolo-Kantor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Heuett</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Pressley</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Estimating weekly national opioid overdose deaths in near real time using multiple proxy data sources</article-title>
          <source>JAMA Netw Open</source>
          <year>2022</year>
          <month>07</month>
          <day>01</day>
          <volume>5</volume>
          <issue>7</issue>
          <fpage>e2223033</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35862045"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2022.23033</pub-id>
          <pub-id pub-id-type="medline">35862045</pub-id>
          <pub-id pub-id-type="pii">2794462</pub-id>
          <pub-id pub-id-type="pmcid">PMC9305381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="web">
          <article-title>Drug slang code words</article-title>
          <source>Drug Enforcement Administration</source>
          <year>2017</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ndews.umd.edu/sites/ndews.umd.edu/files/dea-drug-slang-code-words-may2017.pdf">https://ndews.umd.edu/sites/ndews.umd.edu/files/dea-drug-slang-code-words-may2017.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lokala</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Lamy</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Daniulaityte</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gaur</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gyrard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thirunarayan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kursuncu</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Sheth</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Drug abuse ontology to harness web-based data for substance use epidemiology research: ontology development study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2022</year>
          <month>12</month>
          <day>23</day>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>e24938</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2022/12/e24938/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24938</pub-id>
          <pub-id pub-id-type="medline">36563032</pub-id>
          <pub-id pub-id-type="pii">v8i12e24938</pub-id>
          <pub-id pub-id-type="pmcid">PMC9823583</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="web">
          <article-title>Home page</article-title>
          <source>The Urban Dictionary</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.urbandictionary.com/define.php?term=a%7Cnd">https://www.urbandictionary.com/define.php?term=a%7Cnd</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arshonsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bunting</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Bragg</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Informal coping strategies among people who use opioids during COVID-19: thematic analysis of reddit forums</article-title>
          <source>JMIR Form Res</source>
          <year>2022</year>
          <month>03</month>
          <day>03</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e32871</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2022/3/e32871/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/32871</pub-id>
          <pub-id pub-id-type="medline">35084345</pub-id>
          <pub-id pub-id-type="pii">v6i3e32871</pub-id>
          <pub-id pub-id-type="pmcid">PMC8896559</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bunting</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Arshonsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bragg</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Socially-supportive norms and mutual aid of people who use opioids: an analysis of Reddit during the initial COVID-19 pandemic</article-title>
          <source>Drug Alcohol Depend</source>
          <year>2021</year>
          <month>05</month>
          <day>01</day>
          <volume>222</volume>
          <fpage>108672</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33757708"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.drugalcdep.2021.108672</pub-id>
          <pub-id pub-id-type="medline">33757708</pub-id>
          <pub-id pub-id-type="pii">S0376-8716(21)00167-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8057693</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bunting</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Arshonsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Bragg</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>"How will I get my next week's script?" Reactions of Reddit opioid forum users to changes in treatment access in the early months of the coronavirus pandemic</article-title>
          <source>Int J Drug Policy</source>
          <year>2021</year>
          <month>06</month>
          <volume>92</volume>
          <fpage>103140</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33558165"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.drugpo.2021.103140</pub-id>
          <pub-id pub-id-type="medline">33558165</pub-id>
          <pub-id pub-id-type="pii">S0955-3959(21)00038-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8994991</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Keasar</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Sznitman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Baumel</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Suicide prevention outreach on social media delivered by trained volunteers</article-title>
          <source>Crisis</source>
          <year>2023</year>
          <month>05</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>247</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1027/0227-5910/a000864"/>
          </comment>
          <pub-id pub-id-type="doi">10.1027/0227-5910/a000864</pub-id>
          <pub-id pub-id-type="medline">35656647</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Proactive suicide prevention online (PSPO): machine identification and crisis management for Chinese social media users with suicidal thoughts and behaviors</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>05</month>
          <day>08</day>
          <volume>21</volume>
          <issue>5</issue>
          <fpage>e11705</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/5/e11705/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11705</pub-id>
          <pub-id pub-id-type="medline">31344675</pub-id>
          <pub-id pub-id-type="pii">v21i5e11705</pub-id>
          <pub-id pub-id-type="pmcid">PMC6682269</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Notredame</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Grandgenèvre</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pauwels</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Morgiève</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wathelet</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vaiva</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Séguin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Leveraging the web and social media to promote access to care among suicidal individuals</article-title>
          <source>Front Psychol</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>1338</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30154742"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyg.2018.01338</pub-id>
          <pub-id pub-id-type="medline">30154742</pub-id>
          <pub-id pub-id-type="pmcid">PMC6102313</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Coppersmith</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Ethical research protocols for social media health research</article-title>
          <source>Proceedings of the 1st ACL Workshop on Ethics in Natural Language Processing</source>
          <year>2017</year>
          <conf-name>EthNLP '17</conf-name>
          <conf-date>April 4th, 2017</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
          <fpage>94</fpage>
          <lpage>102</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.18653/v1/W17-1612"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/w17-1612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poudel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weninger</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Navigating the post-API dilemma search engine results pages present a biased view of social media data</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online March 11, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/ARXIV.2401.15479"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3589334.3645503</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="web">
          <article-title>r/research</article-title>
          <source>Reddit</source>
          <year>2024</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.reddit.com/r/research/">https://www.reddit.com/r/research/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leeson</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Resnick</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rovers</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing (NLP) in qualitative public health research: a proof of concept study</article-title>
          <source>Int J Qual Methods</source>
          <year>2019</year>
          <month>11</month>
          <day>13</day>
          <volume>18</volume>
          <fpage>160940691988702</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/1609406919887021"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1609406919887021</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
