<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id><journal-id journal-id-type="publisher-id">infodemiology</journal-id><journal-id journal-id-type="index">38</journal-id><journal-title>JMIR Infodemiology</journal-title><abbrev-journal-title>JMIR Infodemiology</abbrev-journal-title><issn pub-type="epub">2564-1891</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v5i1e65835</article-id><article-id pub-id-type="doi">10.2196/65835</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Exploring Social Media Posts on Lifestyle Behaviors: Sentiment and Content Analysis</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Yip</surname><given-names>Yan Yee</given-names></name><degrees>MPharm, MClinPharm</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yaakub</surname><given-names>Mohd Ridzwan</given-names></name><degrees>BSc, MSc, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Makmor-Bakry</surname><given-names>Mohd</given-names></name><degrees>BPharm, MClinPharm, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Abu Latiffi</surname><given-names>Muhammad 
Iqbal</given-names></name><degrees>BSc, MSc</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Chong</surname><given-names>Wei Wen</given-names></name><degrees>BPharm, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Centre for Quality Management of Medicines, Faculty of Pharmacy, Universiti Kebangsaan Malaysia</institution><addr-line>Jalan Raja Muda Abdul Aziz</addr-line><addr-line>Kuala Lumpur</addr-line><country>Malaysia</country></aff><aff id="aff2"><institution>Centre for Clinical Epidemiology, Institute for Clinical Research, National Institutes of Health, Ministry of Health Malaysia</institution><addr-line>Setia Alam, Shah Alam</addr-line><country>Malaysia</country></aff><aff id="aff3"><institution>Center for Artificial Intelligence Technology, Faculty of Information Science &#x0026; Technology, Universiti Kebangsaan Malaysia</institution><addr-line>Bangi, Selangor Darul Ehsan</addr-line><country>Malaysia</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Haupt</surname><given-names>Michael</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Rasool</surname><given-names>Abdur</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Gore</surname><given-names>Ross</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Wei Wen Chong, BPharm, PhD, Centre for Quality Management of Medicines, Faculty of Pharmacy, Universiti Kebangsaan Malaysia, Jalan Raja Muda Abdul Aziz, Kuala Lumpur, 50300, Malaysia, 60 392897265; <email>weiwen@ukm.edu.my</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date 
pub-type="epub"><day>25</day><month>6</month><year>2025</year></pub-date><volume>5</volume><elocation-id>e65835</elocation-id><history><date date-type="received"><day>24</day><month>09</month><year>2024</year></date><date date-type="rev-recd"><day>26</day><month>01</month><year>2025</year></date><date date-type="accepted"><day>13</day><month>02</month><year>2025</year></date></history><copyright-statement>&#x00A9; Yan Yee Yip, Mohd Ridzwan Yaakub, Mohd Makmor-Bakry, Muhammad Iqbal Abu Latiffi, Wei Wen Chong. Originally published in JMIR Infodemiology (<ext-link ext-link-type="uri" xlink:href="https://infodemiology.jmir.org">https://infodemiology.jmir.org</ext-link>), 25.6.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://infodemiology.jmir.org/">https://infodemiology.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2025/1/e65835"/><abstract><sec><title>Background</title><p>There has been an increase in the prevalence of noncommunicable diseases in Malaysia. This can be prevented and managed through the adoption of healthy lifestyle behaviors, including not smoking, avoiding alcohol consumption, maintaining a balanced diet, and being physically active. 
The growing importance of using social media to deliver information on healthy behaviors has led health care professionals (HCPs) to lead these efforts. To ensure effective delivery of information on healthy lifestyle behaviors, HCPs should begin by understanding users&#x2019; current opinions about these behaviors and whether the users are receptive to recommended health practices. Nevertheless, there has been limited research conducted in Malaysia that aims to identify the sentiments and content of posts, as well as how well users&#x2019; perceptions align with recommended health practices.</p></sec><sec><title>Objective</title><p>This study aims to examine social media posts related to various lifestyle behaviors, by using a combination of sentiment analysis to analyze users&#x2019; sentiments and manual content analysis to explore the content of the posts and how well users&#x2019; perceptions align with recommended health practices.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using keywords based on lifestyle behaviors, posts originating from X (formerly known as Twitter) and published in Malaysia between November and December 2022 were scraped for sentiment analysis. Posts with positive and negative sentiments were randomly selected for content analysis. A codebook was developed to code the selected posts according to content and alignment of users&#x2019; perceptions with recommended health practices.</p></sec><sec sec-type="results"><title>Results</title><p>A total of 3320 posts were selected for sentiment analysis. Significant associations were observed between sentiment class and lifestyle behaviors (<italic>&#x03C7;</italic><sup>2</sup><sub>6</sub>=67.64; <italic>P</italic>&#x003C;.001), with positive sentiments higher than negative sentiments for all lifestyle behaviors. 
Findings from content analysis of 1328 posts revealed that most of the posts were about users&#x2019; narratives (492/1328), general statements (203/1328), and planned actions toward the conduct of their behavior (196/1328). More than half of tobacco-, diet-, and activity-related posts were aligned with recommended health practices, whereas most of the alcohol-related posts were not aligned with recommended health practices (63/112).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>As most of the alcohol-related posts did not align with recommended health practices, the findings reflect a need for HCPs to increase their delivery of health information on alcohol consumption. It is also important to ensure the ongoing health promotion of the other 3 lifestyle behaviors on social media, while continuing to monitor the discussions made by social media users.</p></sec></abstract><kwd-group><kwd>consumer health information</kwd><kwd>content analysis</kwd><kwd>chronic illness</kwd><kwd>health promotion</kwd><kwd>healthy lifestyle</kwd><kwd>lifestyle</kwd><kwd>lifestyle risk reduction</kwd><kwd>internet</kwd><kwd>primary prevention</kwd><kwd>sentiment analysis</kwd><kwd>social media</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Noncommunicable diseases (NCDs) have become a significant global health challenge, accounting for 74% of all deaths worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. NCDs have also become a growing public health concern in middle-income countries within the Southeast Asia region. Malaysia is one of the countries in the region that has been significantly impacted by NCDs, with over 67% premature NCD-related mortality and over 70% disease burden [<xref ref-type="bibr" rid="ref2">2</xref>]. 
Approximately 2.5% of Malaysian adults, which accounts for over half a million people, were affected by all 4 major NCDs, which are diabetes, hypertension, hypercholesterolemia, and obesity [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>The World Health Organization (WHO) has identified 4 key modifiable risk factors associated with an elevated risk of NCDs, which are tobacco smoking, harmful use of alcohol, unhealthy diet, and physical inactivity [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. The adoption of healthy lifestyle behaviors, including not smoking, avoiding alcohol consumption, maintaining a balanced diet, and being physically active, can reduce modifiable risk factors, effectively preventing and managing NCDs. However, national surveys have indicated that the actual adoption of healthy behaviors among Malaysians remains low. For example, over 84% of Malaysian adults were inactive in sports, with half of the population leading a sedentary lifestyle, spending more than 2 hours sitting while awake [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>In this regard, it is important to deliver information on healthy lifestyle behaviors, with health care professionals (HCPs) being ideally positioned to lead these efforts. Various technologies, such as mHealth applications, wearable devices [<xref ref-type="bibr" rid="ref5">5</xref>], and social media platforms, can support the delivery of health information. Social media platforms have been widely used for health information delivery as these platforms are accessible to larger populations at a lower cost [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. To effectively promote healthy lifestyle behaviors on social media, HCPs could begin by understanding users&#x2019; current opinions on lifestyle behaviors and whether they are receptive to recommended health practices [<xref ref-type="bibr" rid="ref8">8</xref>]. 
This could be achieved by examining social media posts discussing lifestyle behaviors. X (formerly known as Twitter) is a microblog-based social media platform that allows users to freely express their opinions through posts, previously referred to as tweets. As of January 2024, approximately 5.71 million social media users in Malaysia were on X, accounting for 16.5% of the country&#x2019;s population [<xref ref-type="bibr" rid="ref9">9</xref>], which highlights the growing popularity of X among Malaysians.</p><p>When users express their opinions in writing on social media, a range of emotions may be conveyed. Sentiment analysis is the process of classifying this textual data based on the emotions conveyed within the text as positive, negative, or neutral sentiments [<xref ref-type="bibr" rid="ref10">10</xref>]. It can be conducted through manual annotation of posts or computational approaches [<xref ref-type="bibr" rid="ref11">11</xref>]. Computational approaches in sentiment analysis are preferred as they are more cost-efficient, and can leverage large amounts of publicly accessible and concise real-time data across different regions and demographics [<xref ref-type="bibr" rid="ref12">12</xref>]. Methodologies of computational approaches include lexicon-based sentiment analysis, which uses pre-existing dictionaries containing words with pre-assigned sentiment scores of positive, negative, or neutral. Lexicon-based sentiment analysis is effective when limited labelled training data is available with a strong association of sentiments with specific words. 
The usage of this approach has been documented in numerous studies that analyze sentiments regarding lifestyle behaviors such as the examination of policies on electronic cigarettes [<xref ref-type="bibr" rid="ref13">13</xref>], vegan-related posts [<xref ref-type="bibr" rid="ref14">14</xref>], and organic food posts [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Lexicon-based sentiment analysis, however, may have limited coverage in terms of vocabulary and often misses sarcasm or irony [<xref ref-type="bibr" rid="ref16">16</xref>]. Positive sentiments may not necessarily translate to good health practices and vice versa. For example, the sentence &#x201C;I love tobacco&#x201D; showed positive sentiments, but the actual context is related to the user&#x2019;s preference towards unhealthy lifestyle behaviors. In order to further understand the topics communicated on social media and how users&#x2019; perceptions are aligned with recommended health practices, lexicon-based sentiment analysis can be supported with manual content analysis. A codebook can be used to manually assign labels to each post, which will provide a more in-depth analysis of the posts [<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>The examination of social media posts across multiple lifestyle behaviors of tobacco smoking, alcohol consumption, diet, and physical activity could facilitate effective comparisons of findings across these different behaviors. The use of such findings would enable HCPs to use social media to deliver information on healthy behaviors by targeting areas where the lifestyle behaviors are not aligned with recommended health practices. Analyses that are focused within a geographic location would provide opportunities for HCPs to prioritize region-targeted health information delivery on social media. 
Such health information could also potentially be replicated in other countries with similar digital and health ecosystems.</p><p>Nevertheless, there have been limited studies that used the combined approaches of lexicon-based sentiment and content analysis to examine social media posts on lifestyle behaviors. The majority of the available studies were focused on other health-related issues such as the examination of users&#x2019; perceptions on diabetes [<xref ref-type="bibr" rid="ref18">18</xref>] and marijuana usage [<xref ref-type="bibr" rid="ref19">19</xref>]. A study by Kasson et al [<xref ref-type="bibr" rid="ref20">20</xref>] used both sentiment analysis and manual content analysis to examine users&#x2019; vaping behaviors. However, the study was confined to vaping behaviors during the e-cigarette or vaping use-associated lung injury outbreak and did not address other lifestyle behaviors. In addition, there is a lack of studies examining the opinions of social media users in Malaysia on lifestyle behaviors, despite the increasing burden of NCDs and the rising prevalence of unhealthy lifestyle behaviors in the country.</p><p>Therefore, this study used a combination of lexicon-based sentiment analysis and manual content analysis to understand the discussions on lifestyle behaviors among social media users in Malaysia. This study had three objectives: (1) to determine the sentiments of social media users in Malaysia regarding lifestyle behaviors, (2) to identify the content of posts and ascertain if users&#x2019; perceptions were aligned with recommended health practices, and (3) to explore the associations between the alignment of users&#x2019; perceptions with recommended health practices and sentiment class.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p><xref ref-type="fig" rid="figure1">Figure 1</xref> shows the overall study methods. 
In the classification of sentiments in posts, data was scraped from X. Following the manual exclusion of irrelevant posts, the data was cleaned, preprocessed and analyzed for sentiments. Data visualization was subsequently conducted. In the manual content analysis of posts, a random selection of posts with positive and negative sentiments for each lifestyle behavior was manually coded to identify the content of posts and the alignment of users&#x2019; perceptions with recommended health practices. Associations between the alignment of users&#x2019; perceptions and sentiment class were subsequently explored.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overall study methods.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e65835_fig01.png"/></fig></sec><sec id="s2-2"><title>Classification of Sentiments in Posts</title><sec id="s2-2-1"><title>Data Scraping</title><p>The automated process of extracting large amounts of data from X is known as data scraping. All posts with keywords related to the 4 lifestyle behaviors aimed at reducing the 4 key modifiable risk factors for NCDs were scraped. These keywords are related to tobacco and its derivative products, alcohol, dietary, and physical activity. The 4 sets of keywords are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The keywords were derived from published systematic reviews on the management of lifestyle behaviors using social media [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Additional keywords commonly used locally were added upon discussion with all researchers.</p><p>Posts spanning 2 consecutive months were selected. 
This time frame was deemed to be appropriate, as similar studies analyzing health-related sentiments on the X platform have also utilized data across a 2-month period [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The selection of the 2 consecutive months was conducted by initially scraping all posts from January to December 2022 according to each month. The 2 months with the highest number of posts were from November to December 2022. Posts based in Malaysia were determined using longitude and latitude metadata (4.2105&#x00B0;N, 101.9758&#x00B0;E). In terms of language, posts in Malay and English were scraped. Malay is the national language of Malaysia, whereas English is widely spoken and understood by Malaysians. They also use a mix of both languages, resulting in multilingual data.</p><p>Data scraping was conducted separately for each set of keywords using the SNScrape library on Python. In addition to posts, other X metadata such as timestamp, X username, number of reposts, language, and location were also collected.</p></sec><sec id="s2-2-2"><title>Manual Exclusion of Data</title><p>All posts were manually screened by 2 researchers to exclude those not suitable for analysis, with discrepancies resolved among the research team. The exclusion steps were as follows:</p><p>First, the exclusion of posts not from Malaysia&#x2014;During data scraping, longitude and latitude data retained posts located within the coordinates but posted outside of Malaysia, such as parts of Singapore and Thailand. The &#x201C;location&#x201D; metadata was therefore used to manually exclude these posts.</p><p>Second, the exclusion of irrelevant posts&#x2014;Irrelevant posts include posts with different definitions (eg, &#x201C;exercising&#x201D; your rights), posts not related to health care (eg, religious restrictions on alcohol), indecipherable posts and posts made by bots. 
Bots were verified by manually checking the user&#x2019;s profile for any unusual activity patterns that exhibited automated behavior (eg, high frequency of posts without breaks).</p></sec><sec id="s2-2-3"><title>Data Preprocessing</title><p>Before conducting sentiment analysis, data preprocessing was carried out to ensure that the text data was cleaned, transformed, and prepared for analysis.</p><p>The model selected for sentiment analysis was the Valence Aware Dictionary and Sentiment Reasoner (VADER) on Python. It is a lexicon-based sentiment analysis tool [<xref ref-type="bibr" rid="ref25">25</xref>] that is suitable for analyzing social media posts, generating results with high classification success [<xref ref-type="bibr" rid="ref26">26</xref>]. As VADER is trained for sentiment analysis in English, all posts in Malay and mixed languages were preprocessed and translated into English using the langid and googletrans libraries on Python.</p><p>Other data preprocessing steps (tokenization, lower casing of texts, removal of stop words, html links, numbers, punctuations, emojis, and acronyms) were not executed. This is attributed to the unique advantages of VADER, in which assessment scores would account for capitalization, punctuations, emojis, English acronyms (eg, &#x201C;LOL&#x201D;), and colloquialisms (eg, &#x201C;meh&#x201D;) [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>].</p><p>Following data preprocessing, a word cloud was used to provide a visual representation of the words in the overall X dataset.</p></sec><sec id="s2-2-4"><title>Sentiment Analysis</title><p>Computational, lexicon-based sentiment analysis was conducted to determine users&#x2019; sentiments. This approach was selected over manual annotations and other types of computational methods as it is cost-effective and does not require training for large datasets. As it relies on a predefined lexicon, it does not require significant computational resources. 
For general sentiment analysis, lexicon-based approaches often perform well enough to capture the overall sentiment trends in social media data [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>The posts that have undergone data preprocessing were then analyzed for polarity using VADER. VADER classifies posts into positive, neutral, and negative sentiments. Positive sentiments have a compound score of &#x2265;0.05, neutral sentiments have a score between &#x003E;&#x2212;0.05 and &#x003C;0.05 and negative sentiments have a score of &#x2264;&#x2212;0.05 [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>Computer-assisted translation tools may limit the extent of translation in posts that contain local dialects and slang. The translated posts may become indecipherable, causing them to be classified as having &#x201C;neutral&#x201D; sentiments. For example, &#x201C;x&#x201D; in Malay, which means &#x201C;no&#x201D; in English may not have undergone translation, resulting in sentiments not being classified accurately. Following the first round of sentiment analysis, the structures of the translated posts that were unclear and yielded neutral sentiments were manually improved. The sentiment analysis was then re-run to enhance the robustness of sentiment classification and to reduce the inaccurate labeling of posts.</p></sec></sec><sec id="s2-3"><title>Manual Content Analysis of Posts With Positive and Negative Sentiments</title><p>Sentiment analysis classifies texts according to the emotions conveyed [<xref ref-type="bibr" rid="ref10">10</xref>]. However, there was no further elaboration on the content and whether users&#x2019; perceptions were aligned with recommended health practices.</p><p>Therefore, a sample of posts with positive and negative sentiments were randomly selected for manual content analysis. Stratified sampling was conducted by dividing the posts according to the type of lifestyle behavior and sentiment class (positive or negative). 
For each type of lifestyle behavior and sentiment class, 20% of the total posts for the particular lifestyle behavior were subjected to random selection. This would allow the posts for each lifestyle behavior to have an equal number of positive and negative sentiments. The random sample of posts was generated by using the random number equation in Microsoft Excel relative to the ID number attached to each post. This approach was adopted from a previous content analysis study on X, which also manually coded a random sample of 20% of total posts [<xref ref-type="bibr" rid="ref30">30</xref>].</p><p>A preliminary codebook with 2 categories was developed through discussions among the research team to classify the content of posts and the alignment of users&#x2019; perceptions with recommended health practices. This codebook is partially adapted from the codes used by Miller et al [<xref ref-type="bibr" rid="ref31">31</xref>]. The recommended health practices are based on WHO&#x2019;s health recommendations [<xref ref-type="bibr" rid="ref32">32</xref>]. In brief, WHO advocates healthy practices, including abstaining from smoking and alcohol consumption, maintaining a balanced diet, and engaging in regular physical activities. The codes were mutually exclusive. Using the preliminary codebook, 100 posts (25 posts for each type of lifestyle behavior) were independently coded by 2 coders. Interrater reliability was conducted to measure the agreement of each post between both coders. The preliminary codebook was refined until a Cohen kappa score of 0.80 was achieved. 
The remaining posts were then coded independently using the finalized codebook by both coders.</p><p><xref ref-type="table" rid="table1">Table 1</xref> provides a brief description of the codes for the finalized codebook, with a more comprehensive codebook provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Brief description of codes.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Definition</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Post content (Topical content dealing with the lifestyle behavior mentioned in the post)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Self-narrative of current lifestyle behaviors</td><td align="left" valign="top">Narration of self&#x2019;s current lifestyle behaviors.</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Narrative of others&#x2019; current lifestyle behaviors</td><td align="left" valign="top">Talked about other people&#x2019;s current lifestyle behaviors.</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Planned action related to lifestyle behaviors</td><td align="left" valign="top">A planned action that will be conducted by the person who wrote the post.</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recommendations related to lifestyle behaviors</td><td align="left" valign="top">A recommendation by the person who wrote the post, providing instruction, advice, or suggestion to others.</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Direct question</td><td align="left" valign="top">Direct question used in a post.</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>General statement</td><td align="left" valign="top">General statement that is not under any of the other categories above.</td></tr><tr><td align="left" valign="top" colspan="2">Alignment of users&#x2019; perceptions with recommended health practices (Whether users&#x2019; perceptions in posts are aligned with WHO&#x2019;s health recommendations)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Aligned with recommended health practices</td><td align="left" valign="top">Users agreed with the conduct of recommended health practices, that included not smoking, avoiding alcohol consumption, maintaining a balanced diet and being physically active.</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Not aligned with recommended health practices</td><td align="left" valign="top">Users were not agreeable with the conduct of recommended health practices (eg, consumed oily food, refused to exercise).</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Users&#x2019; perceptions cannot be defined</td><td align="left" valign="top">The perceptions of the user could not be defined or linked with health practices.</td></tr></tbody></table></table-wrap></sec><sec id="s2-4"><title>Data Analysis</title><p>Data analysis was performed using descriptive statistics with all variables expressed in frequencies and percentages. 
The Pearson chi-square test was used to compare the associations between the categorical variables, with <italic>P</italic> values &#x003C;.05 considered to be statistically significant. IBM SPSS Statistics version 26.0 was used for data analysis.</p><p>Findings were also visualized using a word cloud and bar charts. In addition, examples of posts were provided to describe the study findings.</p></sec><sec id="s2-5"><title>Ethical Considerations</title><p>This study was approved by the Medical Research and Ethics Committee, Ministry of Health Malaysia (NMRR ID-23&#x2010;00293-CIM [IIR]) on March 23, 2023, and the Research Ethics Committee, Universiti Kebangsaan Malaysia (UKM PPI/111/8/JEP-2023&#x2010;174) on April 13, 2023.</p><p>As this study relied solely on publicly available social media data on X and did not involve direct interaction with individuals, informed consent was not applicable. No compensation was offered or provided, as the study did not involve direct participation of human participants.</p><p>No identifiable private user information was collected or analyzed. All data used in the analysis were publicly available and did not contain personally identifiable information.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview of X Dataset</title><p><xref ref-type="fig" rid="figure2">Figure 2</xref> shows the flowchart of the selection of the X dataset.</p><p>A total of 9581 posts were scraped from November to December 2022. Following the exclusion of 3047 posts that were not in Malaysia and 3214 irrelevant posts, 3320 posts across 4 types of lifestyle behaviors were retained for sentiment analysis. Almost half of the posts were dietary-related (1530/3320, 46.1%), followed by activity-related (810/3320, 24.4%) and tobacco-related (700/3320, 21.1%) posts. 
Alcohol-related posts were present in only one-tenth of the posts (280/3320, 8.4%).</p><p>As data scraping was conducted separately for each lifestyle behavior, a post may appear more than two times across different behaviors. Out of the 3320 posts, 3180 (95.8%) posts showed 1 lifestyle behavior only. There were 140 posts with two types of lifestyle behaviors mentioned, with three-quarters (104/140, 74.3%) of posts mentioning both dietary- and activity-related behaviors.</p><p>A word cloud was used to visualize the overall X dataset (n=3320; see <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). Overall, the 5 terms most commonly mentioned by users were &#x201C;diet,&#x201D; &#x201C;rice,&#x201D; &#x201C;eat,&#x201D; &#x201C;sugar,&#x201D; and &#x201C;smoke.&#x201D;</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Flowchart of selection of X dataset. Examples of irrelevant posts include (1) tobacco-related posts: gaming-type of posts (eg, smoke mentioned in a game), music band names (eg, Cigarettes After Sex), tweet mentioning terms as a location (eg, Hookah Island, Vape Shop); (2) alcohol-related posts: banning alcohol due to religion with no links to health (eg, at Qatar for the World Cup), sarcasm-based (eg, &#x201C;you must be drunk,&#x201D; which translates to &#x201C;you must be kidding me&#x201D;); (3) dietary-related posts: nephew in Malay (eg, anak buah), nonhealth posts (eg, fruit on the trees or plants, sugar daddy); (4) activity-related posts: posts mentioning terms as a location (eg, Sports Direct), nonhealth posts (eg, who will be Sports Minister?, &#x201C;exercising&#x201D; your rights). 
With regard to posts overlapping lifestyle behaviors, as data scraping was conducted separately for each lifestyle behavior, a post may appear more than 2 times across different behaviors (eg, the post talks about both smoking and dietary habits).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e65835_fig02.png"/></fig></sec><sec id="s3-2"><title>Findings From Classification of Sentiments in Posts</title><p><xref ref-type="table" rid="table2">Table 2</xref> presents the frequency distribution of sentiment analysis, with examples for each lifestyle behavior provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p><p>The overall percentage of positive sentiments almost doubled that of negative sentiments (1874/3320, 56.5%) vs (1027/3320, 30.9%). Results have shown a significant association between sentiment class and lifestyle behaviors (<italic>&#x03C7;</italic><sup>2</sup><sub>6</sub>=67.64; <italic>P</italic>&#x003C;.001), with positive sentiments being higher than negative sentiments for all lifestyle behaviors. The trends for dietary- and activity-related posts were similar, with both showing approximate percentages of 60% for positive sentiments and 27% for negative sentiments. This was followed by alcohol-related posts with positive sentiments of 54.7% (153/280). 
Less than half of tobacco-related posts (314/700, 44.9%) had positive sentiments, with the percentage differences between sentiment classes slightly below 2%.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Frequency distribution of sentiment analysis before and after structure improvement of posts using Valence Aware Dictionary and Sentiment Reasoner (VADER; n=3320).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Lifestyle behaviors</td><td align="left" valign="bottom" colspan="3">Sentiment count before structure improvement of posts, n (%)</td><td align="left" valign="bottom" colspan="3">Sentiment count after structure improvement of posts, n (%)<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom">Total, n</td></tr><tr><td align="left" valign="top"/><td align="left" valign="bottom">Positive</td><td align="left" valign="bottom">Neutral</td><td align="left" valign="bottom">Negative</td><td align="left" valign="bottom">Positive</td><td align="left" valign="bottom">Neutral</td><td align="left" valign="bottom">Negative</td><td align="left" valign="top"/></tr></thead><tbody><tr><td align="left" valign="top">Tobacco-related posts</td><td align="left" valign="top">254 (36.3)</td><td align="left" valign="top">197 (28.1)</td><td align="left" valign="top">249 (35.6)</td><td align="left" valign="top">314 (44.9)</td><td align="left" valign="top">84 (12)</td><td align="left" valign="top">302 (43.1)</td><td align="left" valign="top">700</td></tr><tr><td align="left" valign="top">Alcohol-related posts</td><td align="left" valign="top">120 (42.9)</td><td align="left" valign="top">95 (33.9)</td><td align="left" valign="top">65 (23.2)</td><td align="left" valign="top">153 (54.7)</td><td align="left" valign="top">41 (14.6)</td><td align="left" valign="top">86 (30.7)</td><td align="left" valign="top">280</td></tr><tr><td align="left" 
valign="top">Dietary-related posts</td><td align="left" valign="top">724 (47.3)</td><td align="left" valign="top">455 (29.7)</td><td align="left" valign="top">351 (23)</td><td align="left" valign="top">916 (59.9)</td><td align="left" valign="top">197 (12.9)</td><td align="left" valign="top">417 (27.2)</td><td align="left" valign="top">1530</td></tr><tr><td align="left" valign="top">Activity-related posts</td><td align="left" valign="top">378 (46.7)</td><td align="left" valign="top">246 (30.4)</td><td align="left" valign="top">186 (22.9)</td><td align="left" valign="top">491 (60.6)</td><td align="left" valign="top">97 (12)</td><td align="left" valign="top">222 (27.4)</td><td align="left" valign="top">810</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1874 (56.5)</td><td align="left" valign="top">419 (12.6)</td><td align="left" valign="top">1027 (30.9)</td><td align="left" valign="top">3320</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Sentiment count after structure improvement of posts were used for analysis. A Pearson chi-square test was conducted to test the associations between sentiment class and lifestyle behaviors (<italic>&#x03C7;</italic><sup>2</sup><sub>6</sub>=67.64, <italic>P</italic>&#x003C;.001).</p></fn><fn id="table2fn2"><p><sup>b</sup>Not applicable.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Findings From Manual Content Analysis of Posts</title><p>A total of 1328 posts with an equal number of positive and negative sentiments for each lifestyle behavior were selected for manual content analysis. 
They comprised 280 tobacco-related posts (140 posts for each sentiment class), 112 alcohol-related posts (56 posts for each sentiment class), 612 dietary-related posts (306 posts for each sentiment class), and 324 activity-related posts (162 posts for each sentiment class).</p><p>Prior to the manual content analysis of all 1328 posts, 100 posts were first subjected to interrater reliability testing. The Cohen kappa scores for both categories of post content and the alignment of users&#x2019; perceptions with recommended health practices were 0.807 and 0.801, respectively.</p><p>The frequency of posts is tabulated in <xref ref-type="table" rid="table3">Table 3</xref>. Overall, the 3 content categories with the highest number of posts were self-narratives of current lifestyle behaviors (492/1328, 37%), general statements (203/1328, 15.3%) and planned actions (196/1328, 14.8%). Self-narratives were the most popular content for all types of lifestyle behaviors except for tobacco-related posts, in which the majority were narratives of others&#x2019; current behaviors (96/280, 34.3%). Question-based posts were the least popular content for tobacco-, alcohol-, and activity-related posts, with less than 10% present in all types. Users&#x2019; perceptions in more than half of the posts were aligned with recommended health practices (769/1328, 57.9%). Similar proportions were observed for all types of lifestyle behaviors except for alcohol-related posts, in which posts not aligned with recommended health practices were double those aligned with recommended health practices (63/112, 56.3% vs 33/112, 29.4%).</p><p><xref ref-type="fig" rid="figure3">Figure 3</xref> shows the frequency of posts that demonstrated the alignment of users&#x2019; perceptions with recommended health practices according to the sentiment classification. A total of 3 main findings were observed. 
First, in dietary- and activity-related posts, significant associations between sentiment class and alignment of users&#x2019; perceptions with recommended health practices were observed (<italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=30.98, <italic>P</italic>&#x003C;.001 and <italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=24.16, <italic>P</italic>&#x003C;.001, respectively). In both positive and negative sentiment classes, the percentages of posts aligned with recommended health practices were significantly higher than those not aligned with recommended health practices and those with undefined user perceptions, with percentages ranging from 49.3% to 80.2%. Posts with positive sentiments that aligned with recommended health practices showcased users&#x2019; optimism to stay healthy (eg, &#x201C;I&#x2019;m ready to cut sugar. Let&#x2019;s go&#x201D; [D-919-positive]). Meanwhile, negative sentiments that aligned with recommended health practices highlighted users&#x2019; worries to stay healthy (eg, &#x201C;Feel the weight.. rise suddenly. Sad. Have to fix it&#x201D; [P-522-negative]).</p><p>Second, in tobacco-related posts, there was no significant association between sentiment class and alignment of users&#x2019; perceptions with recommended health practices (<italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=5.76; <italic>P</italic>=.06). Among posts with positive sentiments, the percentage of posts that aligned with recommended health practices was similar to those not aligned with recommended health practices, with a percentage difference of 7.1%. When users posted about tobacco with positive emotions, the likelihood of their perceptions aligning with the recommended health practices of not smoking (eg, &#x201C;Please pray that I can stop smoking&#x2026;&#x201D; [T-563-positive]) was similar to that of aligning with hazardous smoking practices (eg, &#x201C;My kind of chill with cigar&#x201D; [T-412-positive]). 
Despite the lack of significant association, the percentage of posts with negative sentiments that aligned with recommended health practices was noticeably higher than those that did not align with recommended health practices (86/140, 61.4% vs 41/140, 29.3%).</p><p>Third, a lack of significant association between sentiment class and alignment of users&#x2019; perceptions with recommended health practices was also observed in alcohol-related posts (<italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=4.62; <italic>P</italic>=.10). Although the findings were not statistically significant, the percentage of posts not aligned with recommended health practices was higher than those aligned with recommended health practices for both positive (37/56, 66.1% vs 12/56, 21.4%) and negative (26/56, 46.4% vs 21/56, 37.5%) sentiment classes. Positive sentiments leading to alcohol consumption included celebratory posts (eg, &#x201C;I&#x2019;m gonna have so much wine this weekend&#x201D; [A-55-positive]), whereas negative sentiments involved users coping with worries (&#x201C;I am going to drown my sorrows in alcohol and pick things back up tomorrow&#x201D; [A-198-negative]). 
Examples of posts selected for manual content analysis are provided in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Frequency of posts according to post content and alignment of users&#x2019; perceptions with recommended health practices (n=1328).</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom" colspan="4">Lifestyle behaviors</td><td align="left" valign="bottom">Total posts (N=1328)</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Tobacco-related (n=280)</td><td align="left" valign="bottom">Alcohol-related (n=112)</td><td align="left" valign="bottom">Dietary-related (n=612)</td><td align="left" valign="bottom">Activity-related (n=324)</td><td align="left" valign="bottom"/></tr></thead><tbody><tr><td align="left" valign="top" colspan="6">Post content, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Self-narrative of current lifestyle behaviors</td><td align="left" valign="top">70 (25)</td><td align="left" valign="top">36 (32.1)</td><td align="left" valign="top">243 (39.7)</td><td align="left" valign="top">143 (44.1)</td><td align="left" valign="top">492 (37)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Narrative of others&#x2019; current lifestyle</td><td align="left" valign="top">96 (34.3)</td><td align="left" valign="top">17 (15.2)</td><td align="left" valign="top">40 (6.5)</td><td align="left" valign="top">22 (6.8)</td><td align="left" valign="top">175 (13.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Planned action related to lifestyle behaviors</td><td align="left" 
valign="top">26 (9.3)</td><td align="left" valign="top">15 (13.4)</td><td align="left" valign="top">97 (15.8)</td><td align="left" valign="top">58 (17.9)</td><td align="left" valign="top">196 (14.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recommendations related to lifestyle behaviors</td><td align="left" valign="top">35 (12.5)</td><td align="left" valign="top">13 (11.6)</td><td align="left" valign="top">83 (13.6)</td><td align="left" valign="top">46 (14.2)</td><td align="left" valign="top">177 (13.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Direct question</td><td align="left" valign="top">17 (6.1)</td><td align="left" valign="top">6 (5.4)</td><td align="left" valign="top">45 (7.4)</td><td align="left" valign="top">17 (5.3)</td><td align="left" valign="top">85 (6.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>General statement</td><td align="left" valign="top">36 (12.8)</td><td align="left" valign="top">25 (22.3)</td><td align="left" valign="top">104 (17)</td><td align="left" valign="top">38 (11.7)</td><td align="left" valign="top">203 (15.3)</td></tr><tr><td align="left" valign="top" colspan="6">Alignment of users&#x2019; perceptions with recommended health practices, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Aligned with recommended health practices</td><td align="left" valign="top">152 (54.3)</td><td align="left" valign="top">33 (29.4)</td><td align="left" valign="top">365 (59.7)</td><td align="left" valign="top">219 (67.6)</td><td align="left" valign="top">769 (57.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Not aligned with 
recommended health practices</td><td align="left" valign="top">97 (34.6)</td><td align="left" valign="top">63 (56.3)</td><td align="left" valign="top">147 (24)</td><td align="left" valign="top">55 (17)</td><td align="left" valign="top">362 (27.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Users&#x2019; perceptions cannot be defined</td><td align="left" valign="top">31 (11.1)</td><td align="left" valign="top">16 (14.3)</td><td align="left" valign="top">100 (16.3)</td><td align="left" valign="top">50 (15.4)</td><td align="left" valign="top">197 (14.8)</td></tr></tbody></table></table-wrap><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Stacked bar charts of alignment of users&#x2019; perceptions with recommended health practices stratified according to sentiment classification. A Pearson chi-square test was conducted for each lifestyle behavior to test the associations between sentiment class and alignment of users&#x2019; perceptions with recommended health practices (tobacco: <italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=5.76, <italic>P</italic>=.06; alcohol: <italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=4.62, <italic>P</italic>=.10; dietary: <italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=30.98, <italic>P</italic>&#x003C;.001; activity: <italic>&#x03C7;</italic><sup>2</sup><sub>2</sub>=24.16, <italic>P</italic>&#x003C;.001).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e65835_fig03.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Overview</title><p>To the best of our knowledge, this is the first study in the region that examined discussions on X across multiple lifestyle behaviors. 
This study is also the first of its kind that used dual approaches of lexicon-based sentiment analysis and manual content analysis of posts to examine users&#x2019; sentiments, post content and the alignment of users&#x2019; perceptions with recommended health practices. Positive sentiments were significantly higher than negative sentiments for all 4 lifestyle behaviors. In dietary- and activity-related posts, users exhibited twice as many positive sentiments as negative ones. The majority of the sampled posts were self-narratives of current lifestyle behaviors. More than half of the sampled tobacco-, dietary-, and activity-related posts were aligned with WHO&#x2019;s recommended health practices, with contrasting results in alcohol-related posts.</p></sec><sec id="s4-2"><title>Principal Findings</title><p>Data scraping has shown that dietary-related topics were the lifestyle behaviors most frequently discussed. The usage of a more extensive set of search terms in scraping dietary-related posts covered a variety of nutrition-based topics involving individuals across all age groups. This resulted in dietary-related discourses among young children and adolescents (eg, formula milk, vegetables, and fruits consumption). Users frequently mentioned &#x201C;rice,&#x201D; which is attributed to Malaysians&#x2019; staple diet, with the average Malaysian adult consuming 82.3 kilograms of rice annually [<xref ref-type="bibr" rid="ref33">33</xref>]. In contrast, alcohol-related topics were the least discussed lifestyle behaviors among users. Alcohol-related discussions in Malaysia were largely anchored on themes related to cultural and religious beliefs. Alcohol consumption among Malaysians is generally lower as behaviors are influenced by compartmentalization among the three main races in Malaysia [<xref ref-type="bibr" rid="ref34">34</xref>]. 
Malays who are Muslims are not allowed to consume alcohol as it is forbidden in Islam [<xref ref-type="bibr" rid="ref35">35</xref>], whereas no restrictions were imposed on the Chinese and Indian communities [<xref ref-type="bibr" rid="ref34">34</xref>]. The prohibition of alcohol consumption in certain communities was hypothesized as one of the reasons for the lower frequency of alcohol-related posts, compared to other lifestyle behaviors.</p><p>Findings indicate that positive sentiments significantly outweighed negative sentiments for all lifestyle behaviors. In dietary- and activity-related posts, positive sentiments were found to be twice as many as negative sentiments, which is consistent with the sentiment analysis findings of Shaw et al [<xref ref-type="bibr" rid="ref36">36</xref>] who analyzed over 1.5 million posts on dietary and exercise topics. In our study, more than half of the sampled posts were either self-narratives or planned actions for self-implementation. It could be postulated that the posts with positive sentiments were driven by self-determination theory (SDT), a comprehensive theory of human motivation and personality that focuses on individuals&#x2019; intrinsic tendencies for growth. SDT assumes the importance of autonomous motivation, which is a type of self-emanating motivation that is consistent with users&#x2019; innate values to engage in behaviors or pursue a goal [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. The field of autonomous motivation has been extensively studied in the context of dietary and exercise lifestyle behaviors [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>]. 
Individuals who are autonomously motivated have a sense of self-control over their actions (eg, choose to exercise regularly), leading to an increase in positive sentiments, personal fulfilment and enjoyment in the actions pursued [<xref ref-type="bibr" rid="ref40">40</xref>].</p><p>In tobacco-related posts, positive sentiments were found to be higher than negative sentiments, albeit with a small percentage difference. This suggests that in tobacco-related discourses, users tend to either feel positive emotions (eg, satisfaction, happiness, and trust) or negative emotions (eg, dissatisfaction, unhappiness, and worry). Mixed sentiments were found to be prevalent in discussions related to vaping among both the scientific community [<xref ref-type="bibr" rid="ref42">42</xref>] and the general public [<xref ref-type="bibr" rid="ref43">43</xref>]. In Malaysia, the Health Ministry has proposed the Generational End Game plan, which would ban tobacco sales for those born after 2005. The bill was first tabled at the country&#x2019;s parliamentary discussions in July 2022 and had yet to be finalized at the time the social media posts were scraped from X [<xref ref-type="bibr" rid="ref44">44</xref>]. Such uncertainties towards health policy changes have generated both positive and negative reactions, with the issue being debated constantly throughout the year. Users either praised the government&#x2019;s efforts to mitigate smoking behaviors or expressed concerns about such &#x201C;untested&#x201D; plans [<xref ref-type="bibr" rid="ref45">45</xref>]. The negative reactions may also have stemmed from users&#x2019; awareness of the adverse effects of smoking, with over 90% of male lung cancer patients in Malaysia having a significant history of smoking [<xref ref-type="bibr" rid="ref46">46</xref>]. 
In addition, 3500 out of 10,000 annual deaths were linked to smoking [<xref ref-type="bibr" rid="ref47">47</xref>].</p><p>As discussed, the predominance of self-narratives in posts related to diet, physical activity and alcohol consumption is likely due to users&#x2019; autonomous motivation and self-awareness to perform a behavior. Conversely, most posts related to tobacco were found to be linked to narratives of other users. As tobacco smoking has been associated with social stigmatization due to its negative health impact on others, users may have been more reluctant to post from a first-person perspective. Instead, users opt to openly discuss the smoking habits of others. In addition, sharing experiences in a third-person perspective may be preferred by users to maintain anonymity. During the 20th century, smokers were often viewed as &#x201C;mysterious&#x201D; or &#x201C;cool,&#x201D; but this social status has slowly diminished over the past two decades [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]. In Malaysia, this was propelled by smoking reduction strategies, such as the ban on smoking in public eateries implemented in 2019, that socially impacted users&#x2019; impression toward smoking [<xref ref-type="bibr" rid="ref50">50</xref>].</p><p>In recent years, there has been a growing trend of health influencers using online platforms to actively share their dietary and fitness regimens. Previous studies have shown that social media users who were exposed to this information delivered by health influencers as well as content from other social media users, were more likely to be receptive to adopting healthy practices, such as maintaining a balanced diet and being physically active [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>]. 
The results were consistent with the findings of this study, which showed a significantly higher percentage of dietary- and activity-related posts by social media users that were aligned with recommended health practices. Nevertheless, HCPs must remain active in advocating positive lifestyle behaviors on social media. Although almost one-fifth of posts for these two lifestyle behaviors were on planned actions, this may not always translate into actions by the population. This is a caveat of much research that relies on social media or self-reported data on social media. It is often unclear whether individuals actually follow through on what they post about, highlighting the intention-behavior gap [<xref ref-type="bibr" rid="ref54">54</xref>]. Findings from the Malaysian National Health and Morbidity Survey (NHMS) conducted in 2023 have shown that the actual adoption of healthy practices was still lacking among the Malaysian public. Almost 95.1% of Malaysian adults did not meet the recommended daily intake of fruits and vegetables, consuming only two servings of fruit or vegetables daily instead of the recommended five servings daily [<xref ref-type="bibr" rid="ref3">3</xref>]. The prevalence of physical inactivity among Malaysian adults was at 29.9% [<xref ref-type="bibr" rid="ref3">3</xref>], which was also considerably higher than other Asian countries, including China and India [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref56">56</xref>].</p><p>There was a lack of significant association between sentiment class and alignment with recommended health practices in both tobacco- and alcohol-related posts. Despite the smaller number of sampled alcohol-related posts, it is interesting to note that the alignment of users&#x2019; perceptions with recommended health practices had contrasting outcomes compared to the other three lifestyle behaviors. 
In more than half of the alcohol-related posts with positive and negative sentiments, users&#x2019; perceptions were not aligned with recommended health practices. Most users perceived alcohol consumption as a casual and an affordable social activity and did not acknowledge the potential health risks involved. A survey conducted in Thailand, a country of similar income setting, had previously mentioned the popularity of alcohol being a social activity among urban communities [<xref ref-type="bibr" rid="ref57">57</xref>]. In Malaysia, alcoholic beverages were available for purchase at neighborhood convenience stores, which allowed for easy purchases of takeaway alcohol [<xref ref-type="bibr" rid="ref35">35</xref>]. This further downplayed users&#x2019; awareness of the negative consequences of alcohol consumption [<xref ref-type="bibr" rid="ref58">58</xref>].</p><p>Assessment of posts made by social media users on X allows HCPs to identify priority areas for social media-based health information delivery on this platform. As most alcohol-related posts do not align with health recommendations, it is postulated that greater emphasis should be placed on strategies to limit alcohol consumption among users in Malaysia. The WHO has proposed collaborative efforts with HCPs and journalists to improve targeted public health messaging to the public. A guide was recently developed for journalists to facilitate media reporting to communities on the harms of alcohol consumption [<xref ref-type="bibr" rid="ref58">58</xref>]. While the other 3 lifestyle behaviors were mostly aligned with recommended health practices, it remains essential for HCPs to continuously deliver information advocating healthy behaviors. Online approaches allow HCPs to deliver information beyond geographic barriers, reaching a wider audience in diverse community settings. 
Therefore, health information can be adopted by users in countries with similar cultural beliefs, including countries within the Southeast Asia region.</p></sec><sec id="s4-3"><title>Strengths and Limitations</title><p>The strengths of this study included its comprehensive coverage of 4 lifestyle behaviors aimed at reducing the 4 key modifiable risk factors under WHO&#x2019;s health priority [<xref ref-type="bibr" rid="ref4">4</xref>]. This allowed for the simultaneous analysis of posts across different lifestyle behaviors. Unlike most studies that focus on global contexts, this research uniquely focused on the Malaysian context. It provides insights into the cultural and social dynamics that influence discussions around lifestyle behaviors in this specific region. Notably, the inclusion of alcohol-related posts in analysis shed light on culturally and socially nuanced discussions within the region. This is particularly valuable in regions like Malaysia, where religious and cultural factors strongly influence alcohol consumption. In addition, the retrospective examination of social media posts utilized approaches of lexicon-based sentiment analysis and manual content analysis. The dual approach provided real-time and spontaneous insights into users&#x2019; opinions on lifestyle behaviors while addressing limitations of single-method studies. Findings from this study could assist HCPs in prioritizing the delivery of region-specific health information through social media.</p><p>Nevertheless, a few limitations should be considered. First, potential bias may exist during the selection of social media dataset. In self-selection bias, users who choose to share their opinions on social media may not represent the broader population. The study may be subjected to data selection bias as it included only social media posts in Malay and English, excluding other spoken languages in Malaysia, such as Chinese and Tamil. 
Nevertheless, sentiment analysis studies on X in Malaysia have largely concentrated on data scraped in Malay and English [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>]. Demographic bias may be present due to the overrepresentation or underrepresentation of certain groups on X. For instance, the majority of users in Malaysia who post on social media are aged between 25 and 34 years [<xref ref-type="bibr" rid="ref9">9</xref>]. The limitations in the availability of metadata on X also prevented the collection of demographic data such as age, gender and race, as most users did not disclose this information in their profiles. Population bias may occur in geotagged posts utilizing longitude and latitude metadata. Previous literature has indicated that only 1% of users would geotag their location in posts [<xref ref-type="bibr" rid="ref61">61</xref>]. Nevertheless, this is the most effective method to scrape posts that are published within a specific location.</p><p>Second, there are limitations in the study design and methods used for sentiment analysis and manual content analysis. The study is cross-sectional in nature and provides a snapshot of discussions at a specific time. Therefore, temporal bias may exist, making it challenging to track changes in sentiments or behaviors over time. In addition, posts that were collected for sentiment analysis and manual content analysis over two consecutive months may not accurately reflect year-round sentiments and discussions, as findings may vary due to the presence of health-related events occurring at certain times of the year. The events may include changes in legislation, prominent public health campaigns or disease outbreaks. The quality of the dataset was ensured by verifying that there were no notable health-related occurrences between November and December 2022. 
In addition, previous studies analyzing users&#x2019; sentiments and content have similarly explored health data over two consecutive months [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The manual content analysis of social media posts can be time-consuming due to the involvement of large datasets; therefore, only 20% of the total posts were randomly selected using stratified sampling. This percentage was previously utilized in a content analysis study by Mathieson et al [<xref ref-type="bibr" rid="ref30">30</xref>]. While analyzing the full dataset would provide more comprehensive findings, the randomized sample offers a reliable snapshot for identifying the thematic content without the substantial time and resource demands of manual analysis for the entire dataset. Furthermore, prior to sentiment analysis, the computer-assisted translation of posts from Malay to English may have led to inaccuracies due to the usage of local dialects, sarcasm or slang. To enhance sentiment labeling, the structures of translated posts with neutral sentiments that were unclear were manually refined, and sentiment analysis was repeated.</p><p>Third, the study results should be interpreted with caution regarding posts on alcohol consumption, due to the smaller sample size of 112 posts. A power analysis indicated that this sample size is adequate for detecting effects, with a power of 0.82. Furthermore, we acknowledge the presence of potential interactions in posts with overlapping lifestyle behaviors (eg, a post that talks about diet and physical activity). In sentiment analysis, the conduct of Pearson chi-square tests also did not account for potential confounding factors or interactions in posts with overlapping lifestyle behaviors. 
To account for this limitation, we compared the proportions between sentiment count for posts showing 1 lifestyle behavior only (n=3180), and sentiment count for posts across 4 types of lifestyle behaviors (n=3320). The proportions of sentiment counts for both were similar to each other. In addition, while many of the Pearson chi-square associations were significant, these may not imply causality and thus may not inform categorically that the observed sentiments result in practicing different lifestyle behaviors or the direction of the relationship.</p></sec><sec id="s4-4"><title>Implications and Further Research</title><p>The findings from this study could help HCPs to prioritize the delivery of health information on lifestyle behaviors using social media tailored to the targeted region, which is Malaysia. Given the low number of alcohol-related posts by social media users in Malaysia, HCPs could focus on initiating positive discussions around this topic to raise awareness about the harmful effects of alcohol consumption. In addition, most of the alcohol-related posts made by social media users were not aligned with recommended health practices. There is an increased need for HCPs to emphasize limiting and stopping alcohol consumption, while also acknowledging that the users&#x2019; attitudes towards alcohol consumption may still vary among different religions in Malaysia. Health advocacy for positive lifestyle behaviors on social media should continue for the other three lifestyle behaviors.</p><p>Further research could be proposed to explore the opinions of social media users toward lifestyle behaviors in Malaysia. First, despite the statistical significance observed in the associations between sentiment classification and lifestyle behaviors, the percentage difference between both sentiment classes in tobacco-related posts was small. Therefore, it would be interesting to investigate whether tobacco sentiments would vary over time. 
We may want to further track sentiments by time series analysis to explore changes in users&#x2019; emotions towards tobacco across a time period. The tracking of real-time sentiments across a time period was previously conducted in a review examining public health data on X that included posts on alcohol consumption [<xref ref-type="bibr" rid="ref62">62</xref>]. In addition, since posts are scraped based on location metadata, future studies could leverage these data to explore the relationship between the prevalence of specific lifestyle behaviors in certain locations (eg, urban areas in Malaysia) and the intensity of lifestyle behavior-related discussions on social media. A similar study has previously been conducted in the United States; therefore, conducting such studies in the Malaysian context would be beneficial [<xref ref-type="bibr" rid="ref63">63</xref>].</p><p>Second, the majority of posts involved content related to self-narratives of lifestyle behaviors. These self-narratives outlined X&#x2019;s roles as a microblog for users to freely express the behaviors they practice from a first-person perspective. As self-narratives encompass a broad and generalized category, it may be beneficial to conduct a more detailed examination of posts that only described users&#x2019; self-narratives. This in-depth analysis would provide insights into the specific themes commonly discussed by users from a first-person perspective. In addition, the examination of posts could be extended to other lifestyle behaviors such as sleep patterns, which is particularly relevant as active social media users are mainly adolescents and young adults who are commonly affected by sleep-related issues [<xref ref-type="bibr" rid="ref64">64</xref>].</p><p>Third, this study was conducted on the microblogging platform X. It is also important to examine social media posts made by users on other platforms, such as Facebook. 
Future research is proposed to analyze the sentiments and content of posts on these platforms. Audience demographics can vary across these platforms. For instance, younger millennials may be more active on X, whereas Facebook often attracts a slightly older audience [<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>]. Comparing our study findings with those obtained from Facebook could help HCPs to deliver health messages that suit the audiences of different social media platforms.</p><p>Fourth, our study emphasizes accessibility and simplicity in data visualization and reporting to effectively communicate findings to a diverse audience, including non-technical stakeholders such as HCPs, public health practitioners and policymakers. To achieve this, we employed techniques like word clouds, which provide a visually appealing representation of frequently mentioned terms in the dataset, and lexicon-based sentiment analysis, which is straightforward to implement as it does not require additional labeled data or extensive training. We recognize the potential value of more advanced methods and suggest exploring these techniques in future studies related to the conduct of in-depth text analysis. These may include approaches like topic modeling or keyword co-occurrence analysis to summarize text data through word groups, as well as training machine learning models such as support vector machines or Na&#x00EF;ve Bayes to classify sentiments. Furthermore, hybrid methods of sentiment analysis could be explored by integrating machine learning models with lexicon-based approaches. These combined models can then be assessed for accuracy and robustness through comparative analysis. 
Similar studies have been conducted previously in both health and non-health posts [<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref68">68</xref>].</p></sec><sec id="s4-5"><title>Conclusion</title><p>In conclusion, the incorporation of lexicon-based sentiment analysis holds significance as it enabled the use of large amounts of data to capture users&#x2019; emotions whilst posting on lifestyle behaviors. Positive sentiments were significantly expressed in posts for all lifestyle behaviors. Nevertheless, there was a small percentage difference observed in tobacco-related posts, indicating a more varied sentiment among users. Most of the posts showed users&#x2019; own narratives and planned actions towards the conduct of a behavior. As the majority of alcohol-related discussions were not aligned with recommended health practices, this reflects the need for individual HCPs and health organizations to increase their delivery of health information pertaining to alcohol consumption on social media platforms. It is also equally important for HCPs to continue providing health information on other lifestyle behaviors to social media users, while monitoring ongoing discussions by users on social media.</p></sec></sec></body><back><ack><p>The authors would like to thank the director-general of Health Malaysia for his permission to publish this article. The work was supported by the Ministry of Higher Education of Malaysia&#x2019;s Fundamental Research Grant Scheme under grant FRGS/1/2020/SS0/UKM/02/11. The funders played no role in study design, collection, analysis, interpretation of data, or writing of the report.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>YYY, MRY, and WWC contributed to the conception or design of the study. 
YYY and MIAL contributed to data collection of the study. YYY, MIAL, and WWC contributed to data analysis of the study. All authors (YYY, MRY, MM-B, MIAL, and WWC) contributed to data interpretation and provided scientific inputs and technical improvement. YYY drafted the manuscript while MRY and WWC guided the revisions. All authors (YYY, MRY, MM-B, MIAL, and WWC) read and approved the final version for publication.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">HCP</term><def><p>health care professional</p></def></def-item><def-item><term id="abb2">NCD</term><def><p>noncommunicable disease</p></def></def-item><def-item><term id="abb3">NHMS</term><def><p>National Health and Morbidity Survey</p></def></def-item><def-item><term id="abb4">SDT</term><def><p>self-determination theory</p></def></def-item><def-item><term id="abb5">VADER</term><def><p>Valence Aware Dictionary and Sentiment Reasoner</p></def></def-item><def-item><term id="abb6">WHO</term><def><p>World Health Organization</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>Noncommunicable diseases</article-title><source>World Health Organization</source><year>2022</year><access-date>2022-12-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/news-room/fact-sheets/detail/noncommunicable-diseases">https://www.who.int/news-room/fact-sheets/detail/noncommunicable-diseases</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="book"><source>Malaysian Burden of Disease and Injury Study 2009-2014</source><year>2017</year><access-date>2022-12-06</access-date><publisher-name>Institute for Public Health</publisher-name><comment><ext-link ext-link-type="uri" 
xlink:href="https://iku.moh.gov.my/images/IKU/Document/REPORT/BOD/BOD2009-2014.pdf">https://iku.moh.gov.my/images/IKU/Document/REPORT/BOD/BOD2009-2014.pdf</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="book"><source>National Health and Morbidity Survey (NHMS) 2023: Non-Communicable Diseases and Healthcare Demand</source><year>2024</year><access-date>2024-05-24</access-date><publisher-name>Institute for Public Health</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://iku.nih.gov.my/images/nhms2023/key-findings-nhms-2023.pdf">https://iku.nih.gov.my/images/nhms2023/key-findings-nhms-2023.pdf</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="web"><article-title>Reducing modifiable risk factors for noncommunicable diseases</article-title><source>World Health Organization</source><year>2022</year><access-date>2022-12-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/westernpacific/activities/reducing-modifiable-risk-factors-for-noncommunicable-diseases">https://www.who.int/westernpacific/activities/reducing-modifiable-risk-factors-for-noncommunicable-diseases</ext-link></comment></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Miyamoto</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Henderson</surname><given-names>S</given-names> </name><name name-style="western"><surname>Young</surname><given-names>HM</given-names> </name><name name-style="western"><surname>Pande</surname><given-names>A</given-names> </name><name name-style="western"><surname>Han</surname><given-names>JJ</given-names> </name></person-group><article-title>Tracking health data is not enough: a qualitative exploration of the role of healthcare partnerships and mhealth technology to promote 
physical activity and to sustain behavior change</article-title><source>JMIR Mhealth Uhealth</source><year>2016</year><month>01</month><day>20</day><volume>4</volume><issue>1</issue><fpage>e5</fpage><pub-id pub-id-type="doi">10.2196/mhealth.4814</pub-id><pub-id pub-id-type="medline">26792225</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Islam</surname><given-names>SMS</given-names> </name><name name-style="western"><surname>Tabassum</surname><given-names>R</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>The role of social media in preventing and managing non-communicable diseases in low-and-middle income countries: Hope or hype?</article-title><source>Health Policy Technol</source><year>2019</year><month>03</month><volume>8</volume><issue>1</issue><fpage>96</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1016/j.hlpt.2019.01.001</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ventola</surname><given-names>CL</given-names> </name></person-group><article-title>Social media and health care professionals: benefits, risks, and best practices</article-title><source>P T</source><year>2014</year><month>07</month><volume>39</volume><issue>7</issue><fpage>491</fpage><lpage>520</lpage><pub-id pub-id-type="medline">25083128</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Balicer</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Luengo-Oroz</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cohen-Stavi</surname><given-names>C</given-names> 
</name><etal/></person-group><article-title>Using big data for non-communicable disease surveillance</article-title><source>Lancet Diabetes Endocrinol</source><year>2018</year><month>08</month><volume>6</volume><issue>8</issue><fpage>595</fpage><lpage>598</lpage><pub-id pub-id-type="doi">10.1016/S2213-8587(17)30372-8</pub-id><pub-id pub-id-type="medline">29146206</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><article-title>Digital 2024: Malaysia</article-title><source>Data Reportal</source><year>2024</year><access-date>2024-04-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://datareportal.com/reports/digital-2024-malaysia">https://datareportal.com/reports/digital-2024-malaysia</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Tonkin</surname><given-names>EL</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Tonkin</surname><given-names>EL</given-names> </name><name name-style="western"><surname>Tourte</surname><given-names>GJL</given-names> </name></person-group><source>A Day at Work (with Text): A Brief Introduction</source><year>2016</year><edition>1</edition><publisher-name>Chandos Publishing</publisher-name><fpage>23</fpage><lpage>60</lpage><pub-id pub-id-type="other">978-1-84334-749-1</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van Atteveldt</surname><given-names>W</given-names> </name><name name-style="western"><surname>van der Velden</surname><given-names>M</given-names> </name><name name-style="western"><surname>Boukes</surname><given-names>M</given-names> </name></person-group><article-title>The validity of sentiment analysis: comparing manual annotation, 
crowd-coding, dictionary approaches, and machine learning algorithms</article-title><source>Commun Methods Meas</source><year>2021</year><month>04</month><day>3</day><volume>15</volume><issue>2</issue><fpage>121</fpage><lpage>140</lpage><pub-id pub-id-type="doi">10.1080/19312458.2020.1869198</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Abualigah</surname><given-names>L</given-names> </name><name name-style="western"><surname>Alfar</surname><given-names>HE</given-names> </name><name name-style="western"><surname>Shehab</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hussein</surname><given-names>AMA</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Abd Elaziz</surname><given-names>M</given-names> </name><name name-style="western"><surname>Al-qaness</surname><given-names>MAA</given-names> </name><name name-style="western"><surname>Ewees</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Dahou</surname><given-names>A</given-names> </name></person-group><article-title>Sentiment analysis in healthcare: a brief review</article-title><source>Recent Advances in NLP: The Case of Arabic Language</source><year>2020</year><publisher-name>Springer International Publishing</publisher-name><fpage>129</fpage><lpage>141</lpage><pub-id pub-id-type="other">978-3-030-34614-0</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>L</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>Z</given-names> </name><name 
name-style="western"><surname>Li</surname><given-names>D</given-names> </name></person-group><article-title>Perception of the food and drug administration electronic cigarette flavor enforcement policy on twitter: observational study</article-title><source>JMIR Public Health Surveill</source><year>2022</year><month>03</month><day>29</day><volume>8</volume><issue>3</issue><fpage>e25697</fpage><pub-id pub-id-type="doi">10.2196/25697</pub-id><pub-id pub-id-type="medline">35348461</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shamoi</surname><given-names>E</given-names> </name><name name-style="western"><surname>Turdybay</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shamoi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Akhmetov</surname><given-names>I</given-names> </name><name name-style="western"><surname>Jaxylykova</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pak</surname><given-names>A</given-names> </name></person-group><article-title>Sentiment analysis of vegan related tweets using mutual information for feature selection</article-title><source>PeerJ Comput Sci</source><year>2022</year><volume>8</volume><fpage>e1149</fpage><pub-id pub-id-type="doi">10.7717/peerj-cs.1149</pub-id><pub-id pub-id-type="medline">36532810</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rintyarna</surname><given-names>B</given-names> </name></person-group><article-title>Mapping acceptance of indonesian organic food consumption under COVID-19 pandemic using sentiment analysis of Twitter dataset</article-title><source>J Theor Appl Inf 
Technol</source><year>2021</year><access-date>2022-12-12</access-date><volume>99</volume><fpage>1009</fpage><lpage>1019</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://www.jatit.org/volumes/Vol99No5/1Vol99No5.pdf">https://www.jatit.org/volumes/Vol99No5/1Vol99No5.pdf</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaity</surname><given-names>M</given-names> </name><name name-style="western"><surname>Balakrishnan</surname><given-names>V</given-names> </name></person-group><article-title>An integrated semi-automated framework for domain-based polarity words extraction from an unannotated non-English corpus</article-title><source>J Supercomput</source><year>2020</year><month>12</month><volume>76</volume><issue>12</issue><fpage>9772</fpage><lpage>9799</lpage><pub-id pub-id-type="doi">10.1007/s11227-020-03222-0</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mogaji</surname><given-names>E</given-names> </name><name name-style="western"><surname>Balakrishnan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kieu</surname><given-names>TA</given-names> </name></person-group><article-title>Examining consumer behaviour in the UK Energy sector through the sentimental and thematic analysis of tweets</article-title><source>J of Consumer Behaviour</source><year>2021</year><month>03</month><volume>20</volume><issue>2</issue><fpage>218</fpage><lpage>230</lpage><pub-id pub-id-type="doi">10.1002/cb.1820</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karmegam</surname><given-names>D</given-names> </name><name 
name-style="western"><surname>Mappillairaju</surname><given-names>B</given-names> </name></person-group><article-title>Social media analytics and reachability evaluation - #Diabetes</article-title><source>Diabetes &#x0026; Metabolic Syndrome: Clinical Research &#x0026; Reviews</source><year>2022</year><month>01</month><volume>16</volume><issue>1</issue><fpage>102359</fpage><pub-id pub-id-type="doi">10.1016/j.dsx.2021.102359</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Najafizada</surname><given-names>M</given-names> </name><name name-style="western"><surname>Rahman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Donnan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Bishop</surname><given-names>L</given-names> </name></person-group><article-title>Analyzing sentiments and themes on cannabis in Canada using 2018 to 2020 Twitter data</article-title><source>J Cannabis Res</source><year>2022</year><month>04</month><day>13</day><volume>4</volume><issue>1</issue><fpage>22</fpage><pub-id pub-id-type="doi">10.1186/s42238-022-00132-1</pub-id><pub-id pub-id-type="medline">35418169</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kasson</surname><given-names>E</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Cavazos-Rehg</surname><given-names>P</given-names> </name></person-group><article-title>Using a mixed 
methods approach to identify public perception of vaping risks and overall health outcomes on Twitter during the 2019 EVALI outbreak</article-title><source>Int J Med Inform</source><year>2021</year><month>11</month><volume>155</volume><fpage>104574</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2021.104574</pub-id><pub-id pub-id-type="medline">34592539</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chatterjee</surname><given-names>A</given-names> </name><name name-style="western"><surname>Prinz</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gerdes</surname><given-names>M</given-names> </name><name name-style="western"><surname>Martinez</surname><given-names>S</given-names> </name></person-group><article-title>Digital Interventions on healthy lifestyle management: systematic review</article-title><source>J Med Internet Res</source><year>2021</year><month>11</month><day>17</day><volume>23</volume><issue>11</issue><fpage>e26931</fpage><pub-id pub-id-type="doi">10.2196/26931</pub-id><pub-id pub-id-type="medline">34787575</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kohl</surname><given-names>LFM</given-names> </name><name name-style="western"><surname>Crutzen</surname><given-names>R</given-names> </name><name name-style="western"><surname>de Vries</surname><given-names>NK</given-names> </name></person-group><article-title>Online prevention aimed at lifestyle behaviors: a systematic review of reviews</article-title><source>J Med Internet Res</source><year>2013</year><month>07</month><day>16</day><volume>15</volume><issue>7</issue><fpage>e146</fpage><pub-id pub-id-type="doi">10.2196/jmir.2665</pub-id><pub-id pub-id-type="medline">23859884</pub-id></nlm-citation></ref><ref 
id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ong</surname><given-names>SQ</given-names> </name><name name-style="western"><surname>Pauzi</surname><given-names>MBM</given-names> </name><name name-style="western"><surname>Gan</surname><given-names>KH</given-names> </name></person-group><article-title>Text mining and determinants of sentiments towards the COVID-19 vaccine booster of Twitter users in Malaysia</article-title><source>Healthcare (Basel)</source><year>2022</year><month>05</month><day>27</day><volume>10</volume><issue>6</issue><fpage>994</fpage><pub-id pub-id-type="doi">10.3390/healthcare10060994</pub-id><pub-id pub-id-type="medline">35742045</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kent</surname><given-names>EE</given-names> </name><name name-style="western"><surname>Prestin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gaysynsky</surname><given-names>A</given-names> </name><etal/></person-group><article-title>&#x201C;Obesity is the New Major Cause of Cancer&#x201D;: connections between obesity and cancer on Facebook and Twitter</article-title><source>J Cancer Educ</source><year>2016</year><month>09</month><volume>31</volume><issue>3</issue><fpage>453</fpage><lpage>459</lpage><pub-id pub-id-type="doi">10.1007/s13187-015-0824-1</pub-id><pub-id pub-id-type="medline">25865399</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Hutto</surname><given-names>C</given-names> </name><name name-style="western"><surname>Gilbert</surname><given-names>E</given-names> </name></person-group><article-title>VADER: a parsimonious rule-based model for sentiment analysis of social media 
text</article-title><conf-name>Proceedings of the International AAAI Conference on Web and Social Media</conf-name><conf-date>Jun 1-4, 2014</conf-date><conf-loc>Ann Arbor, Michigan</conf-loc><pub-id pub-id-type="doi">10.1609/icwsm.v8i1.14550</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Elbagir</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>J</given-names> </name></person-group><article-title>Twitter sentiment analysis using natural language toolkit and VADER sentiment</article-title><conf-name>Proceedings of the International Multiconference of Engineers and Computer Scientists</conf-name><conf-date>Mar 13-15, 2019</conf-date><conf-loc>Hong Kong</conf-loc><pub-id pub-id-type="doi">10.1142/9789811215094_0005</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wan Min</surname><given-names>WNS</given-names> </name><name name-style="western"><surname>Zulkarnain</surname><given-names>NZ</given-names> </name></person-group><article-title>Comparative evaluation of lexicons in performing sentiment analysis</article-title><source>J Adv Res Comput Tech Software Appl</source><year>2020</year><month>06</month><day>18</day><access-date>2022-12-12</access-date><volume>2</volume><issue>1</issue><fpage>14</fpage><lpage>20</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://jacta.utem.edu.my/jacta/article/view/5207/3684">https://jacta.utem.edu.my/jacta/article/view/5207/3684</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Agarwal</surname><given-names>A</given-names> </name><name 
name-style="western"><surname>Xie</surname><given-names>B</given-names> </name><name name-style="western"><surname>Vovsha</surname><given-names>I</given-names> </name><name name-style="western"><surname>Rambow</surname><given-names>O</given-names> </name></person-group><article-title>Sentiment analysis of Twitter data</article-title><conf-name>Proceedings of the Workshop on Languages in Social Media</conf-name><conf-date>Jun 23, 2011</conf-date><conf-loc>Portland, Oregon</conf-loc></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Emblem</surname><given-names>H</given-names> </name></person-group><article-title>Are you scared, VADER? Understanding how NLP pre-processing impacts VADER scoring</article-title><source>Medium</source><year>2021</year><access-date>2023-07-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://medium.com/data-science/are-you-scared-vader-understanding-how-nlp-pre-processing-impacts-vader-scoring-4f4edadbc91d">https://medium.com/data-science/are-you-scared-vader-understanding-how-nlp-pre-processing-impacts-vader-scoring-4f4edadbc91d</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mathieson</surname><given-names>S</given-names> </name><name name-style="western"><surname>O&#x2019;Keeffe</surname><given-names>M</given-names> </name><name name-style="western"><surname>Traeger</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Ferreira</surname><given-names>GE</given-names> </name><name name-style="western"><surname>Abdel Shaheed</surname><given-names>C</given-names> </name></person-group><article-title>Content and sentiment analysis of gabapentinoid-related tweets: an infodemiology study</article-title><source>Drug Alcohol 
Rev</source><year>2024</year><month>01</month><volume>43</volume><issue>1</issue><fpage>45</fpage><lpage>55</lpage><pub-id pub-id-type="doi">10.1111/dar.13590</pub-id><pub-id pub-id-type="medline">36539307</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Miller</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Jung Kim</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schwartz-Bloom</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Bloom</surname><given-names>PN</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Fuemmeler</surname><given-names>BF</given-names> </name></person-group><article-title>Informing women about the risks of exposing babies to tobacco smoke: outreach and education efforts using Facebook &#x201C;boost posts&#x201D;</article-title><source>Transl Behav Med</source><year>2022</year><month>05</month><day>26</day><volume>12</volume><issue>5</issue><fpage>714</fpage><lpage>720</lpage><pub-id pub-id-type="doi">10.1093/tbm/ibab158</pub-id><pub-id pub-id-type="medline">35532323</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="web"><article-title>Healthy living: what is a healthy lifestyle?</article-title><source>WHO Regional Office for Europe</source><year>1999</year><access-date>2022-12-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://iris.who.int/bitstream/handle/10665/108180/EUR_ICP_;jsessionid=A62C6B339873362BC61C7C8BC6088C38?sequence=1">https://iris.who.int/bitstream/handle/10665/108180/EUR_ICP_;jsessionid=A62C6B339873362BC61C7C8BC6088C38?sequence=1</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Norimah</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Safiah</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jamal</surname><given-names>K</given-names> </name><name name-style="western"><surname>Haslinda</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zuhaida</surname><given-names>H</given-names> </name><name name-style="western"><surname>Rohida</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Food consumption patterns: Findings from the Malaysian Adult Nutrition Survey (MANS)</article-title><source>Malays J Nutr</source><year>2008</year><month>03</month><access-date>2022-12-12</access-date><volume>14</volume><issue>1</issue><comment><ext-link ext-link-type="uri" xlink:href="https://nutriweb.org.my/mjn/publication/14-1/b.pdf">https://nutriweb.org.my/mjn/publication/14-1/b.pdf</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kortteinen</surname><given-names>T</given-names> </name></person-group><article-title>Alcohol in Malaysia: the impact of social transformation</article-title><source>Contemp Drug Probl</source><year>1999</year><month>09</month><volume>26</volume><issue>3</issue><fpage>391</fpage><lpage>411</lpage><pub-id pub-id-type="doi">10.1177/009145099902600303</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Robert Lourdes</surname><given-names>TG</given-names> </name><name name-style="western"><surname>Abd Hamid</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Riyadzi</surname><given-names>MR</given-names> 
</name><etal/></person-group><article-title>Findings from a nationwide study on alcohol consumption patterns in an upper middle-income country</article-title><source>Int J Environ Res Public Health</source><year>2022</year><month>07</month><day>21</day><volume>19</volume><issue>14</issue><fpage>8851</fpage><pub-id pub-id-type="doi">10.3390/ijerph19148851</pub-id><pub-id pub-id-type="medline">35886700</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaw</surname><given-names>G</given-names> </name><name name-style="western"><surname>Zimmerman</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vasquez-Huot</surname><given-names>L</given-names> </name><name name-style="western"><surname>Karami</surname><given-names>A</given-names> </name></person-group><article-title>Deciphering latent health information in social media using a mixed-methods design</article-title><source>Healthcare (Basel)</source><year>2022</year><month>11</month><day>19</day><volume>10</volume><issue>11</issue><fpage>2320</fpage><pub-id pub-id-type="doi">10.3390/healthcare10112320</pub-id><pub-id pub-id-type="medline">36421644</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hagger</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Hardcastle</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Chater</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mallett</surname><given-names>C</given-names> </name><name name-style="western"><surname>Pal</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chatzisarantis</surname><given-names>NLD</given-names> </name></person-group><article-title>Autonomous 
and controlled motivational regulations for multiple health-related behaviors: between- and within-participants analyses</article-title><source>Health Psychol Behav Med</source><year>2014</year><month>01</month><day>1</day><volume>2</volume><issue>1</issue><fpage>565</fpage><lpage>601</lpage><pub-id pub-id-type="doi">10.1080/21642850.2014.912945</pub-id><pub-id pub-id-type="medline">25750803</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ryan</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Deci</surname><given-names>EL</given-names> </name></person-group><article-title>Self-determination theory and the facilitation of intrinsic motivation, social development, and well-being</article-title><source>American Psychologist</source><year>2000</year><volume>55</volume><issue>1</issue><fpage>68</fpage><lpage>78</lpage><pub-id pub-id-type="doi">10.1037/0003-066X.55.1.68</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rutten</surname><given-names>GM</given-names> </name><name name-style="western"><surname>Meis</surname><given-names>JJM</given-names> </name><name name-style="western"><surname>Hendriks</surname><given-names>MRC</given-names> </name><name name-style="western"><surname>Hamers</surname><given-names>FJM</given-names> </name><name name-style="western"><surname>Veenhof</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kremers</surname><given-names>SPJ</given-names> </name></person-group><article-title>The contribution of lifestyle coaching of overweight patients in primary care to more autonomous motivation for physical activity and healthy dietary behaviour: results of a longitudinal study</article-title><source>Int J Behav Nutr Phys 
Act</source><year>2014</year><month>12</month><volume>11</volume><issue>1</issue><fpage>86</fpage><pub-id pub-id-type="doi">10.1186/s12966-014-0086-z</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Teixeira</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Patrick</surname><given-names>H</given-names> </name><name name-style="western"><surname>Mata</surname><given-names>J</given-names> </name></person-group><article-title>Why we eat what we eat: the role of autonomous motivation in eating behaviour regulation</article-title><source>Nutr Bull</source><year>2011</year><month>03</month><volume>36</volume><issue>1</issue><fpage>102</fpage><lpage>107</lpage><pub-id pub-id-type="doi">10.1111/j.1467-3010.2010.01876.x</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Silva</surname><given-names>MN</given-names> </name><name name-style="western"><surname>Markland</surname><given-names>D</given-names> </name><name name-style="western"><surname>Carra&#x00E7;a</surname><given-names>EV</given-names> </name><etal/></person-group><article-title>Exercise autonomous motivation predicts 3-yr weight loss in women</article-title><source>Med Sci Sports Exerc</source><year>2011</year><month>04</month><volume>43</volume><issue>4</issue><fpage>728</fpage><lpage>737</lpage><pub-id pub-id-type="doi">10.1249/MSS.0b013e3181f3818f</pub-id><pub-id pub-id-type="medline">20689448</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Hartmann-Boyce</surname><given-names>J</given-names> </name></person-group><article-title>Why can&#x2019;t scientists agree on e-cigarettes?</article-title><source>The 
Guardian</source><year>2016</year><access-date>2023-05-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.theguardian.com/science/sifting-the-evidence/2016/sep/14/why-cant-scientists-agree-on-e-cigarettes-vaping">https://www.theguardian.com/science/sifting-the-evidence/2016/sep/14/why-cant-scientists-agree-on-e-cigarettes-vaping</ext-link></comment></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kwon</surname><given-names>M</given-names> </name><name name-style="western"><surname>Park</surname><given-names>E</given-names> </name></person-group><article-title>Perceptions and sentiments about electronic cigarettes on social media platforms: systematic review</article-title><source>JMIR Public Health Surveill</source><year>2020</year><month>01</month><day>15</day><volume>6</volume><issue>1</issue><fpage>e13673</fpage><pub-id pub-id-type="doi">10.2196/13673</pub-id><pub-id pub-id-type="medline">31939747</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="web"><article-title>Health minster: MOH to review tobacco generational endgame policy</article-title><source>Malay Mail</source><year>2022</year><access-date>2023-05-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.malaymail.com/news/malaysia/2022/12/08/health-minster-moh-to-review-tobacco-generational-endgame-policy/44238">https://www.malaymail.com/news/malaysia/2022/12/08/health-minster-moh-to-review-tobacco-generational-endgame-policy/44238</ext-link></comment></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="web"><article-title>Mixed sentiments towards smoking &#x2018;end game&#x2019;</article-title><source>New Straits Times</source><year>2022</year><access-date>2023-05-06</access-date><comment><ext-link ext-link-type="uri" 
xlink:href="https://www.nst.com.my/news/nation/2022/07/811829/mixed-sentiments-towards-smoking-end-game">https://www.nst.com.my/news/nation/2022/07/811829/mixed-sentiments-towards-smoking-end-game</ext-link></comment></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="web"><article-title>National strategic plan for cancer control programme, 2021-2025</article-title><source>International Cancer Control Partnership</source><year>2021</year><access-date>2024-08-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.iccp-portal.org/system/files/plans/National_Strategic_Plan_for_Cancer_Control_Programme_2021-2025.pdf">https://www.iccp-portal.org/system/files/plans/National_Strategic_Plan_for_Cancer_Control_Programme_2021-2025.pdf</ext-link></comment></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jusoh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Naing</surname><given-names>NN</given-names> </name><name name-style="western"><surname>Wan-Arfah</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Prevalence and factors influencing smoking behavior among female inmates in Malaysia</article-title><source>Healthcare (Basel)</source><year>2023</year><month>01</month><day>9</day><volume>11</volume><issue>2</issue><fpage>203</fpage><pub-id pub-id-type="doi">10.3390/healthcare11020203</pub-id><pub-id pub-id-type="medline">36673571</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Evans-Polce</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Castaldelli-Maia</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Schomerus</surname><given-names>G</given-names> 
</name><name name-style="western"><surname>Evans-Lacko</surname><given-names>SE</given-names> </name></person-group><article-title>The downside of tobacco control? Smoking and self-stigma: a systematic review</article-title><source>Soc Sci Med</source><year>2015</year><month>11</month><volume>145</volume><fpage>26</fpage><lpage>34</lpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2015.09.026</pub-id><pub-id pub-id-type="medline">26439764</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Castaldelli-Maia</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Ventriglio</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bhugra</surname><given-names>D</given-names> </name></person-group><article-title>Tobacco smoking: From &#x201C;glamour&#x201D; to &#x201C;stigma&#x201D;. A comprehensive review</article-title><source>Psychiatry Clin Neurosci</source><year>2016</year><month>01</month><volume>70</volume><issue>1</issue><fpage>24</fpage><lpage>33</lpage><pub-id pub-id-type="doi">10.1111/pcn.12365</pub-id><pub-id pub-id-type="medline">26449875</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="web"><article-title>Flashback #star50: when smoking was banned at eateries</article-title><source>Star</source><year>2021</year><access-date>2023-05-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.thestar.com.my/news/nation/2021/10/20/flashback-star50-when-smoking-was-banned-at-eateries#:~:text=Malaysia%20enforced%20a%20no%2Dsmoking,rooms%20and%20ashtrays%20were%20prohibited">https://www.thestar.com.my/news/nation/2021/10/20/flashback-star50-when-smoking-was-banned-at-eateries#:~:text=Malaysia%20enforced%20a%20no%2Dsmoking,rooms%20and%20ashtrays%20were%20prohibited</ext-link></comment></nlm-citation></ref><ref 
id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hawkins</surname><given-names>LK</given-names> </name><name name-style="western"><surname>Farrow</surname><given-names>C</given-names> </name><name name-style="western"><surname>Thomas</surname><given-names>JM</given-names> </name></person-group><article-title>Do perceived norms of social media users&#x2019; eating habits and preferences predict our own food consumption and BMI?</article-title><source>Appetite</source><year>2020</year><month>06</month><day>1</day><volume>149</volume><fpage>104611</fpage><pub-id pub-id-type="doi">10.1016/j.appet.2020.104611</pub-id><pub-id pub-id-type="medline">31958481</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Durau</surname><given-names>J</given-names> </name><name name-style="western"><surname>Diehl</surname><given-names>S</given-names> </name><name name-style="western"><surname>Terlutter</surname><given-names>R</given-names> </name></person-group><article-title>Motivate me to exercise with you: the effects of social media fitness influencers on users&#x2019; intentions to engage in physical activity and the role of user gender</article-title><source>Digit Health</source><year>2022</year><volume>8</volume><fpage>20552076221102769</fpage><pub-id pub-id-type="doi">10.1177/20552076221102769</pub-id><pub-id pub-id-type="medline">35615268</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnston</surname><given-names>C</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>WE</given-names> </name></person-group><article-title>Motivating exercise through social media: is a picture always worth a thousand 
words?</article-title><source>Psychol Sport Exerc</source><year>2019</year><month>03</month><volume>41</volume><fpage>119</fpage><lpage>126</lpage><pub-id pub-id-type="doi">10.1016/j.psychsport.2018.12.012</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mohamad Saleh</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Mehellou</surname><given-names>A</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Briandana</surname><given-names>R</given-names> </name></person-group><article-title>Social media impact on sustainable intention and behaviour: a comparative study between university students in Malaysia and Indonesia</article-title><source>JARHE</source><pub-id pub-id-type="doi">10.1108/JARHE-10-2023-0479</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bauman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bull</surname><given-names>F</given-names> </name><name name-style="western"><surname>Chey</surname><given-names>T</given-names> </name><etal/></person-group><article-title>The International Prevalence Study on Physical Activity: results from 20 countries</article-title><source>Int J Behav Nutr Phys Act</source><year>2009</year><month>03</month><day>31</day><volume>6</volume><issue>1</issue><fpage>21</fpage><pub-id pub-id-type="doi">10.1186/1479-5868-6-21</pub-id><pub-id pub-id-type="medline">19335883</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nik-Nasir</surname><given-names>NM</given-names> </name><name 
name-style="western"><surname>Md-Yasin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ariffin</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Physical activity in Malaysia: are we doing enough? Findings from the REDISCOVER Study</article-title><source>Int J Environ Res Public Health</source><year>2022</year><month>12</month><day>15</day><volume>19</volume><issue>24</issue><fpage>16888</fpage><pub-id pub-id-type="doi">10.3390/ijerph192416888</pub-id><pub-id pub-id-type="medline">36554769</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Assanangkornchai</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sam-Angsri</surname><given-names>N</given-names> </name><name name-style="western"><surname>Rerngpongpan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lertnakorn</surname><given-names>A</given-names> </name></person-group><article-title>Patterns of alcohol consumption in the Thai population: results of the National Household Survey of 2007</article-title><source>Alcohol Alcohol</source><year>2010</year><volume>45</volume><issue>3</issue><fpage>278</fpage><lpage>285</lpage><pub-id pub-id-type="doi">10.1093/alcalc/agq018</pub-id><pub-id pub-id-type="medline">20348437</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="web"><article-title>Reporting about alcohol: a guide for journalists</article-title><source>World Health Organization</source><year>2023</year><access-date>2023-09-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://iris.who.int/bitstream/handle/10665/366715/9789240071490-eng.pdf?sequence=1">https://iris.who.int/bitstream/handle/10665/366715/9789240071490-eng.pdf?sequence=1</ext-link></comment></nlm-citation></ref><ref 
id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abu Samah</surname><given-names>KAF</given-names> </name><name name-style="western"><surname>Nor Azharludin</surname><given-names>NM</given-names> </name><name name-style="western"><surname>Riza</surname><given-names>LS</given-names> </name><name name-style="western"><surname>Hasrol Jono</surname><given-names>MNH</given-names> </name><name name-style="western"><surname>Moketar</surname><given-names>NA</given-names> </name></person-group><article-title>Classification and visualization: Twitter sentiment analysis of Malaysia&#x2019;s private hospitals</article-title><source>IJ-AI</source><year>2023</year><month>03</month><day>10</day><volume>12</volume><issue>4</issue><fpage>1793</fpage><pub-id pub-id-type="doi">10.11591/ijai.v12.i4.pp1793-1802</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mohd Yuswardi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ahmad</surname><given-names>NA</given-names> </name></person-group><article-title>Sentiment analysis of Malaysians citizen&#x2019;s emotion towards cyberbullying in Twitter</article-title><source>IJARBSS</source><year>2023</year><month>04</month><volume>13</volume><issue>4</issue><fpage>769</fpage><lpage>780</lpage><pub-id pub-id-type="doi">10.6007/IJARBSS/v13-i4/16777</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Malik</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lamba</surname><given-names>H</given-names> </name><name name-style="western"><surname>Nakos</surname><given-names>C</given-names> </name></person-group><article-title>Population bias in 
geotagged tweets</article-title><conf-name>Proceedings of the International AAAI Conference on Web and Social Media</conf-name><conf-date>May 26-29, 2015</conf-date><conf-loc>University of Oxford, Oxford, UK</conf-loc><pub-id pub-id-type="doi">10.1609/icwsm.v9i4.14688</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lane</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Habib</surname><given-names>D</given-names> </name><name name-style="western"><surname>Curtis</surname><given-names>B</given-names> </name></person-group><article-title>Linguistic methodologies to surveil the leading causes of mortality: scoping review of Twitter for public health data</article-title><source>J Med Internet Res</source><year>2023</year><month>06</month><day>12</day><volume>25</volume><fpage>e39484</fpage><pub-id pub-id-type="doi">10.2196/39484</pub-id><pub-id pub-id-type="medline">37307062</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gore</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Diallo</surname><given-names>S</given-names> </name><name name-style="western"><surname>Padilla</surname><given-names>J</given-names> </name></person-group><article-title>You are what you tweet: connecting the geographic variation in America&#x2019;s obesity rate to Twitter content</article-title><source>PLoS ONE</source><year>2015</year><volume>10</volume><issue>9</issue><fpage>e0133505</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0133505</pub-id><pub-id pub-id-type="medline">26332588</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Owens</surname><given-names>J</given-names> </name><collab>Adolescent Sleep Working Group</collab><collab>Committee on Adolescence</collab></person-group><article-title>Insufficient sleep in adolescents and young adults: an update on causes and consequences</article-title><source>Pediatrics</source><year>2014</year><month>09</month><volume>134</volume><issue>3</issue><fpage>e921</fpage><lpage>e932</lpage><pub-id pub-id-type="doi">10.1542/peds.2014-1696</pub-id><pub-id pub-id-type="medline">25157012</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="web"><article-title>How to determine the best social media platforms for your business</article-title><source>Emphatic</source><year>2024</year><access-date>2024-01-08</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://emphatic.co/how-to-determine-the-best-social-media-platforms-for-your-business">https://emphatic.co/how-to-determine-the-best-social-media-platforms-for-your-business</ext-link></comment></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Riserbato</surname><given-names>R</given-names> </name></person-group><article-title>What a social media target audience is and how to find it</article-title><source>Hubspot</source><year>2024</year><access-date>2024-01-08</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://blog.hubspot.com/marketing/social-media-target-audience">https://blog.hubspot.com/marketing/social-media-target-audience</ext-link></comment></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>M</given-names></name><name name-style="western"><surname>Rasool</surname><given-names>A</given-names> </name><name 
name-style="western"><surname>Jiang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Qu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Kamyab</surname><given-names>M</given-names> </name></person-group><article-title>HSMC: hybrid sentiment method for correlation to analyze COVID-19 tweets</article-title><source>Advances in Natural Computation, Fuzzy Systems and Knowledge Discovery</source><year>2021</year><publisher-loc>Cham</publisher-loc><publisher-name>Springer International Publishing</publisher-name><pub-id pub-id-type="doi">10.1007/978-3-030-89698-0_101</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rasool</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>R</given-names> </name><name name-style="western"><surname>Marjan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Naveed</surname><given-names>T</given-names> </name></person-group><article-title>Twitter sentiment analysis: a case study for apparel brands</article-title><source>J Phys: Conf Ser</source><year>2019</year><month>03</month><day>1</day><volume>1176</volume><issue>2</issue><fpage>022015</fpage><pub-id pub-id-type="doi">10.1088/1742-6596/1176/2/022015</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>List of keywords for data scraping of posts.</p><media xlink:href="infodemiology_v5i1e65835_app1.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Codebook.</p><media xlink:href="infodemiology_v5i1e65835_app2.docx" xlink:title="DOCX File, 27 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Word cloud representation of overall X dataset 
(n=3320).</p><media xlink:href="infodemiology_v5i1e65835_app3.png" xlink:title="PNG File, 2512 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Examples of posts with positive and negative sentiments according to each lifestyle behavior.</p><media xlink:href="infodemiology_v5i1e65835_app4.docx" xlink:title="DOCX File, 20 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Example of posts selected for manual content analysis.</p><media xlink:href="infodemiology_v5i1e65835_app5.docx" xlink:title="DOCX File, 23 KB"/></supplementary-material></app-group></back></article>