<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id>
      <journal-title>JMIR Infodemiology</journal-title>
      <issn pub-type="epub">2564-1891</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v4i1e51701</article-id>
      <article-id pub-id-type="pmid">39661980</article-id>
      <article-id pub-id-type="doi">10.2196/51701</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Uncovering the Top Nonadvertising Weight Loss Websites on Google: A Data-Mining Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mackey</surname>
            <given-names>Tim</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Collins</surname>
            <given-names>Clare</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ciptaningtyas</surname>
            <given-names>Ratri</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Goldstein</surname>
            <given-names>Scott</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lopezosa</surname>
            <given-names>Carlos</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Almenara</surname>
            <given-names>Carlos A</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Health Sciences</institution>
            <institution>Universidad Peruana de Ciencias Aplicadas</institution>
            <addr-line>Av. Alameda San Marcos 11</addr-line>
            <addr-line>Lima, 15067</addr-line>
            <country>Peru</country>
            <fax>51 3133333</fax>
            <phone>51 3133333 ext 2803</phone>
            <email>carlos.almenara@upc.pe</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4929-8720</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Gulec</surname>
            <given-names>Hayriye</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9410-430X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Health Sciences</institution>
        <institution>Universidad Peruana de Ciencias Aplicadas</institution>
        <addr-line>Lima</addr-line>
        <country>Peru</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Interdisciplinary Research Team on Internet and Society</institution>
        <institution>Faculty of Social Studies</institution>
        <institution>Masaryk University</institution>
        <addr-line>Brno</addr-line>
        <country>Czech Republic</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Carlos A Almenara <email>carlos.almenara@upc.pe</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>12</month>
        <year>2024</year>
      </pub-date>
      <volume>4</volume>
      <elocation-id>e51701</elocation-id>
      <history>
        <date date-type="received">
          <day>8</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>22</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>21</day>
          <month>8</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>10</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Carlos A Almenara, Hayriye Gulec. Originally published in JMIR Infodemiology (https://infodemiology.jmir.org), 11.12.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on https://infodemiology.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://infodemiology.jmir.org/2024/1/e51701" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Online weight loss information is commonly sought by internet users, and it may impact their health decisions and behaviors. Previous studies examined a limited number of Google search queries and relied on manual approaches to retrieve online weight loss websites.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to identify and describe the characteristics of the top weight loss websites on Google.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This study gathered 432 Google search queries collected from Google autocomplete suggestions, “People Also Ask” featured questions, and Google Trends data. A data-mining software tool was developed to retrieve the search results automatically, setting English and the United States as the default criteria for language and location, respectively. Domain classification and evaluation technologies were used to categorize the websites according to their content and determine their risk of cyberattack. In addition, the top 5 most frequent websites in nonadvertising (ie, nonsponsored) search results were inspected for quality.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The results revealed that the top 5 nonadvertising websites were healthline.com, webmd.com, verywellfit.com, mayoclinic.org, and womenshealthmag.com. All provided accuracy statements and author credentials. The domain categorization taxonomy yielded a total of 101 unique categories. After grouping the websites that appeared less than 5 times, the most frequent categories involved “Health” (104/623, 16.69%), “Personal Pages and Blogs” (91/623, 14.61%), “Nutrition and Diet” (48/623, 7.7%), and “Exercise” (34/623, 5.46%). The risk of being a victim of a cyberattack was low.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The findings suggested that while quality information is accessible, users may still encounter less reliable content among various online resources. Therefore, better tools and methods are needed to guide users toward trustworthy weight loss information.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>consumer health informatics</kwd>
        <kwd>cyberattack risk</kwd>
        <kwd>data mining</kwd>
        <kwd>Google</kwd>
        <kwd>information seeking</kwd>
        <kwd>weight loss</kwd>
        <kwd>online health information</kwd>
        <kwd>website analysis</kwd>
        <kwd>digital health</kwd>
        <kwd>internet search</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Seeking online health information is prevalent among Americans [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. In 2013, a representative survey of adult internet users in the United States found that 27% had looked online for information about losing or controlling their weight in the last 12 months [<xref ref-type="bibr" rid="ref3">3</xref>]. General search engines are the first tool for health-related queries [<xref ref-type="bibr" rid="ref4">4</xref>]. With an average of over 80 billion monthly visits in 2022, Google is the most preferred search engine for such internet-based activity [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      <p>Although limited, the available evidence points to a lack of quality and comprehensiveness regarding weight loss information in English and Spanish on websites in the United States and the German language web [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. It also indicates the potential risk of accessing information with doubtful credibility, such as deceiving advertisements about commercial and fad diets [<xref ref-type="bibr" rid="ref9">9</xref>]. These findings are concerning because online health information impacts health decisions and behaviors [<xref ref-type="bibr" rid="ref3">3</xref>]. Furthermore, low-quality or misleading information might be detrimental for those who have eating disorder-related symptomatology or obesity because previous research identified a higher frequency for the use of weight loss websites among individuals with body image and body weight concerns [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>Google Trends, an open-source repository, is a popular tool for retrieving the most common search queries about weight loss in previous studies [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. Yet, the Google search engine offers additional “Autocomplete Suggestions” and “People Also Ask” features based on users’ queries. To our knowledge, no previous study used search queries that combined the data from Google Trends and the additional features of the Google Search engine to determine the most frequently accessed weight loss websites. This study aimed to identify and describe the characteristics of the top weight loss websites on Google using an automated approach that combined data from Google Trends and the additional features of the Google Search engine.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Mining</title>
        <p>On April 6, 2021, a comprehensive list of 432 unique search queries about weight loss (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) was retrieved from the Answer Socrates database [<xref ref-type="bibr" rid="ref15">15</xref>] with the search term “weight loss” (without quotations). Answer Socrates is a database of users’ search queries combining Google search suggestions (Autocomplete Suggestions), “People Also Ask” featured questions and Google Trends data. We developed a data-mining software tool (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>) to search for each query in Google and automatically retrieve the results. The tool sets the United States as the default geographical location and English as the default language. In this study, we set the United States as the default location because it is the largest English-speaking country. According to Google Trends, the third largest volume of “weight loss” searches since 2004 has occurred in the United States, after Trinidad and Tobago and South Africa [<xref ref-type="bibr" rid="ref16">16</xref>]. The tool was developed with Python (Python Software Foundation) programming language and designed to gather Google Search engine results through an application programming interface (API) developed by SerpApi [<xref ref-type="bibr" rid="ref17">17</xref>]. More precisely, it is a Python-code tool for data mining that automatically searches each query on Google and retrieves the results for each query in a JSON file. Each JSON file contains Google advertising results, “Google Places” results, “People Also Ask” results, and organic search results, including web address, title, and description. Organic results are nonadvertising (ie, nonsponsored) search results that appear because they are relevant to the search terms [<xref ref-type="bibr" rid="ref18">18</xref>]. By contrast, nonorganic or sponsored or advertising results are paid advertisements and appear above organic results. The Python code tool creates a database (a CSV file) that includes the top 100 organic results for each query (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). To test for the validity of this software tool, the first author performed a manual verification. The tool was set to Peru as the default geographical location because the first author was located in Peru. English was set as the default language because 10 queries were randomly selected from the total of 432 English queries used in this study. A manual search in Google was done separately for each of those 10 queries to compare the results obtained with the software tool. The manual searches were done with an anonymous web browser (Mozilla Firefox) in Peru, with English as the default language of the search engine. The key data (ie, title, description, URL) of the first 10 nonadvertising results for each query were compared, and no differences were found. The tool was used on April 14, 2021. This study focused solely on organic search results. This decision was based on the fact that advertising or sponsored results have already been studied, although several years ago [<xref ref-type="bibr" rid="ref6">6</xref>], and they are idiosyncratic because they are regulated by algorithms. In other words, advertising results are tailored to each user and, therefore, do not represent the results retrieved for all users, as is the case for organic results.</p>
      </sec>
      <sec>
        <title>Data Analyses</title>
        <p>The data analysis procedure is represented in the flowchart below (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Steps of the data analysis procedure.</p>
          </caption>
          <graphic xlink:href="infodemiology_v4i1e51701_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>First, the most frequent websites for the top 5 Google Search results were calculated using Python code (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). This study focused on the top 5 organic search results because nearly 90% of the clicks occur on Google’s first 5 nonadvertising results [<xref ref-type="bibr" rid="ref7">7</xref>]. This clicking behavior might suggest users’ tendency to perceive the information presented at the top as most relevant and helpful. Since we focused on queries looking for answers about weight loss on websites, we expected a similar clicking behavior in this study. Next, the 5 most frequent websites were manually inspected to evaluate their accuracy. Like previous studies [<xref ref-type="bibr" rid="ref6">6</xref>], we examined whether the websites presented an “accuracy statement” that indicated that the provided information was evidence-based, fact-checked, or, at least, had been reviewed to ensure its trustworthiness. Any statement like this within the website indicated that the website provided an accuracy statement. The websites were also examined to evaluate whether author credentials were disclosed when weight loss information was provided. When the authorship of the weight loss information was given, the website was regarded as providing author credentials.</p>
        <p>Then, all the unique websites that appeared in the top 5 results were categorized. There are several methods to categorize websites, including manual and automated processes. A recent study examined several domain classification services and provided directions for future research using website categories⁠ [<xref ref-type="bibr" rid="ref19">19</xref>]. The study found that manual categorization of websites tends to be biased due to disagreements resulting from subjective opinions. In addition, the inherent ambiguity of many categories in taxonomy and the dual nature of many websites contribute to this bias [<xref ref-type="bibr" rid="ref19">19</xref>]. For example, taxonomies containing thousands of categories and websites with ambiguous content, such as tourism blogs advertising casinos, make it difficult to categorize them manually. On the other hand, the study found that domain classification services vary in coverage, meaning that some websites are categorized because the service indexes them, whereas others do not. Furthermore, the accuracy of the categorization is affected by inconsistent taxonomies. Finally, there is low agreement among these services. Consequently, the authors suggest that researchers can manually examine random subsets of categorizations to determine if the labeling quality is sufficient for the purpose of the research study and rely on classification services with category labels acquired through a well-documented process and incorporated into a thoroughly vetted taxonomy [<xref ref-type="bibr" rid="ref19">19</xref>]. Based on those results and recommendations, the following domain classification services were tested: BrightCloud, Curlie, Cyren, FortiGuard, McAfee, VirusTotal, and Zvelo. After manually inspecting the results, we found that Zvelo [<xref ref-type="bibr" rid="ref20">20</xref>] produced the most meaningful and accurate classification labels with a reasonable number of categories (nearly 500).</p>
        <p>Zvelo is a domain classification service with more than 13 years of service. The categories are generated by Zvelo’s human-supervised artificial intelligence (AI) models, and they currently use fourth-generation AI models (personal communication, January 31, 2023). For each URL (ie, web address), the Zvelo database provides 3 classification groups, each with up to 3 categories [<xref ref-type="bibr" rid="ref20">20</xref>]. The first group is the primary classification provided by Zvelo; this is the one used in this study. The other two are additional categorizations provided by the Interactive Advertising Bureau (IAB), a marketing-orientated taxonomy [<xref ref-type="bibr" rid="ref21">21</xref>]. Consistent with the recommendations made by Vallina et al [<xref ref-type="bibr" rid="ref19">19</xref>], Zvelo was preferred over the IAB taxonomy because it provided more extensive coverage of the websites in the dataset. The manual inspection of the website categories revealed that Zvelo’s category labels were also more relevant to the content than the IAB’s. This observation is probably because the IAB is a marketing-oriented domain classification service. We also preferred the Zvelo classification due to its state-of-the-art AI technology use. All categories for each URL are available in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. The categories were retrieved between January 2023 and February 2023.</p>
        <p>Finally, each URL was given a reputation score based on Webroot’s BrightCloud IP Reputation Services [<xref ref-type="bibr" rid="ref22">22</xref>]. The reputation score predicts the risk that an IP will deliver a cyberattack (ie, it identifies malicious addresses). Scores are obtained using big data and a machine-learning algorithm. Scores are grouped into 5 categories: High-risk (1-20), Suspicious (21-40), Moderate-risk (41-60), Low-risk (61-80), and Trustworthy (81-100) [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>Given that no human participants participated in this study and the data were public, the study was deemed exempt from the institutional review board approval process.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>After applying the Python-code tool to each JSON file, a CSV file was created containing a database with the 432 search queries and the Top 100 organic search results (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p>
      <p><xref ref-type="table" rid="table1">Table 1</xref> shows the count of the most frequent website results, the trustworthiness, the reputation, and the web categorization of the top 5 website results.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>The 5 most frequent websites within the top 5 Google search results (N=2160).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="240"/>
          <col width="150"/>
          <col width="150"/>
          <col width="150"/>
          <col width="150"/>
          <col width="160"/>
          <thead>
            <tr valign="top">
              <td>Website</td>
              <td>Total<sup>a</sup>, n (%)</td>
              <td>Accuracy statement</td>
              <td>Author credentials</td>
              <td>Reputation (0-100)<sup>b</sup></td>
              <td>Category</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>healthline.com</td>
              <td>197 (9.12)</td>
              <td>Yes</td>
              <td>Yes</td>
              <td>96</td>
              <td>Health</td>
            </tr>
            <tr valign="top">
              <td>webmd.com</td>
              <td>91 (4.21)</td>
              <td>Yes</td>
              <td>Yes</td>
              <td>96</td>
              <td>Health</td>
            </tr>
            <tr valign="top">
              <td>verywellfit.com</td>
              <td>85 (3.94)</td>
              <td>Yes</td>
              <td>Yes</td>
              <td>88</td>
              <td>Nutrition &#38; diet</td>
            </tr>
            <tr valign="top">
              <td>mayoclinic.org</td>
              <td>79 (3.66)</td>
              <td>Yes</td>
              <td>Yes</td>
              <td>100</td>
              <td>Health</td>
            </tr>
            <tr valign="top">
              <td>womenshealthmag.com</td>
              <td>61 (2.82)</td>
              <td>Yes</td>
              <td>Yes</td>
              <td>88</td>
              <td>Women’s health</td>
            </tr>
            <tr valign="top">
              <td>Other</td>
              <td>1647 (76.25)</td>
              <td>—<sup>c</sup></td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>Total</td>
              <td>2160 (100)</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>Total number of times the website appeared in the top 5 results.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>Cyberattack risk. Scores higher than 80 indicate a trustworthy website.</p>
          </fn>
          <fn id="table1fn3">
            <p><sup>c</sup>Not applicable.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>There were 2160 results (the first 5 organic search results multiplied by 432 queries) and 623 unique websites (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). The most frequent website was healthline.com, which appeared 197/2160 (9.12%) times in the top 5 organic search results. This was followed by webmed.com, verywellfit.com, mayoclinic.org, and womenshealthmag.com. These top 5 most frequent websites provided accuracy statements (eg, fact-check statements) and author credentials. The authors of healthline.com, webmd.com, and verywellfit.com were usually health care professionals. In the case of mayoclinic.org, the authorship was usually declared as “Mayo Clinic Staff.” womenshealthmag.com had several authors who were described as “freelance writers.” In addition, healthline.com, verywellfit.com, and womenshealthmag.com explicitly provided a fact-check statement to assure users that the information was evidence-based and written by health care professionals.</p>
      <p>Next, the 623 websites were categorized by the Zvelo categorization taxonomy [<xref ref-type="bibr" rid="ref23">23</xref>]. In total, 101 unique categories were found (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). The categories with less than 5 appearances were grouped into “Other Categories.” As can be seen in <xref rid="figure2" ref-type="fig">Figure 2</xref>, most websites appeared less than 5 times (Other categories: 132/623 times, 21.23%), indicating a large diversity of results.</p>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Frequency and percentage of website categories.</p>
        </caption>
        <graphic xlink:href="infodemiology_v4i1e51701_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>The following most common categories were “Health” (104/623, 16.69%) and “Personal Pages and Blogs” (91/623, 14.61%), followed far behind by “Nutrition and Diet” (48/623, 7.7%) and “Exercise” (34/623, 5.46%). The most common websites in the “Health” category tended to ensure that they provided the most reliable information (eg, healthline.com). By contrast, “Personal Pages and Blogs” had little to no information about the authorship and accuracy of the information provided, although with some exemptions (eg, thehealthy.com).</p>
      <p><xref ref-type="table" rid="table2">Table 2</xref> shows the 5 most frequent websites for the most frequent categories (not including the “Other Categories”).</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Examples of the most frequent websites for the top categories.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="82"/>
          <col width="234"/>
          <col width="246"/>
          <col width="223"/>
          <col width="215"/>
          <thead>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Health</td>
              <td>Personal pages and blogs</td>
              <td>Nutrition and diet</td>
              <td>Exercise</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>1</td>
              <td>healthline.com</td>
              <td>simple-nourished-living.com</td>
              <td>verywellfit.com</td>
              <td>shape.com</td>
            </tr>
            <tr valign="top">
              <td>2</td>
              <td>webmd.com</td>
              <td>obesitycoverage.com</td>
              <td>livestrong.com</td>
              <td>muscleandfitness.com</td>
            </tr>
            <tr valign="top">
              <td>3</td>
              <td>mayoclinic.org</td>
              <td>thehealthy.com</td>
              <td>mediweightloss.com</td>
              <td>core-trainingpt.com</td>
            </tr>
            <tr valign="top">
              <td>4</td>
              <td>medicalnewstoday.com</td>
              <td>developgoodhabits.com</td>
              <td>precisionnutrition.com</td>
              <td>sparkpeople.com</td>
            </tr>
            <tr valign="top">
              <td>5</td>
              <td>prevention.com</td>
              <td>blog.myfitnesspal.com</td>
              <td>trifectanutrition.com</td>
              <td>thinwithin.com</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>With some exemptions (4.01%), most websites ranked 79 or higher (95.99%) in reputation, with a mean reputation score of 89.85 (SD 8.53). This finding indicates that the average reputation score of websites was trustworthy (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). The reputation scores for the 5 most frequent websites within the top 5 Google search results are displayed in <xref ref-type="table" rid="table1">Table 1</xref><bold>.</bold></p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study identified and described the characteristics of the top weight loss websites on Google using an automated approach that combined data from Google Trends and the additional features of the Google Search engine. The 5 most frequent websites for weight loss were healthline.com, webmd.com, verywellfit.com, mayoclinic.org, and womenshealthmag.com. They provided fact-checked or evidence-based information about weight loss, written by health care professionals with disclosed credentials. We used the Zvelo domain classification service to categorize the search results. The results yielded a wide diversity of website categories. The most common category was “Other Categories,” accounting for around one-fifth of all websites. It was followed by “Health,” “Personal Pages and Blogs,” “Nutrition and Diet,” and “Exercise” categories, which altogether accounted for 45% (277/623) of the search results. When we examined the most frequent 5 websites under these categories, only the “Health” category involved websites with fact-checked or evidence-based weight loss information that disclosed the author’s credentials. By comparison, the information on authorship and the accuracy of the statements was mainly lacking in the “Personal Pages and Blogs,” “Nutrition and Diet,” and “Exercise” categories. Finally, we found that the average reputation of all websites was trustworthy, which indicates that there is no security risk and users are very unlikely to be victims of cyberattacks by these weight loss websites.</p>
      </sec>
      <sec>
        <title>Comparison With Previous Work</title>
        <p>Previous studies found that websites with higher quality and comprehensiveness rank low in the search results [<xref ref-type="bibr" rid="ref6">6</xref>]. Although we identified that evidence-based and fact-checked information was conveyed by the most frequent websites in the top 5 organic search results, it should be noted that what users retrieve as a result of their search queries may not always lead them to the websites with credible information, given that they represent only a fraction of the total number of websites. Furthermore, websites with quality content may get lost among the myriad results, including advertising results that appear first on websites like Google.</p>
        <p>Previous studies adopted the standard website nomenclature and manual categorization of websites based on their source (eg, commercial sites, medical sites, government sites, university sites, news sites, online media sites, and blogs) [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. In this study, we used the Zvelo domain classification service, which uses an AI-based classification engine to apply a topic-based taxonomy for URL classification. Given that we applied this approach for the first time on weight loss websites, there is no previous evidence to compare our findings. Nevertheless, it is noteworthy that earlier studies reported nutrition and exercise as the most frequently addressed topics across the website categories on weight loss. We found that “Personal Pages and Blogs” was a frequent category in the search results, which means that individuals who seek online weight loss information might frequently encounter personal accounts and histories on English-language weight loss websites in the United States. Given that the most frequent websites under “Personal Pages and Blogs,” “Nutrition and Diet,” and “Exercise” categories have suboptimal quality, users who endorse these websites may be at risk of inadequate and even misleading information.</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>In this study, we evaluated the 5 most frequent websites under each category and determined whether they disclosed author credentials and an accuracy statement to ensure their quality. As a next step, future studies can examine each topic category based on other quality criteria, such as the frequency and scope of the evidence-based information provided using manual or automated approaches. This information might give a more in-depth understanding of the content and quality of the website categories. For instance, websites in the “Health” category might be more trustworthy because they integrate a more holistic approach by addressing several evidence-based domains (eg, healthy eating, nutrition, diet, exercise, pharmacotherapy, and behavioral change strategies) for successful weight loss.</p>
        <p>Cyberattacks have social and psychological consequences, such as the series of emotional reactions that can follow a cyberattack (feeling violated, powerless, angry, rage, grief, shame, etc), and previous research has highlighted the importance of addressing them [<xref ref-type="bibr" rid="ref24">24</xref>]. Thus, there are diverse opportunities for future studies, such as studying how cyberattacks target weight loss advertisements and the psychological consequences of these attacks for individuals looking to lose weight.</p>
      </sec>
      <sec>
        <title>Strengths</title>
        <p>Previous studies generated search queries with convenience samples for the terms with which people would search the internet for weight loss information [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. The search terms were then categorized and submitted to the Google Trends repository to obtain the final search queries. The total number of search queries ranged between 26 and 30. In this study, we retrieved 432 unique search queries from Answer Socrates [<xref ref-type="bibr" rid="ref15">15</xref>], which combined Google search suggestions (Autocomplete suggestions), “People Also Ask” featured questions and Google Trends data. We also used a data-mining software tool to determine the top 5 most frequent websites that appeared among the 5 organic search results. This study provided initial evidence that a data-mining software tool can help identify the most common websites for weight loss. This automated approach might also help to inspect other health-related search queries submitted to the Google search engine.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Although this study has strengths, such as the large number of search queries used and the automated approach to retrieve search results and categorize websites, it has some limitations. First, our results are concerned with English-language websites found in the United States; thus, they cannot be generalized to other locations. Further research may focus on different locations for English search queries related to weight loss and compare the Google search results across locations. Second, notwithstanding the fact that actual Google users make the search queries, it is unclear how Google selects them. Therefore, future studies could use different approaches, such as an ecological design, to gather search queries when users search the internet for weight loss information. For example, real-time data capture techniques, including an ecological momentary assessment, can be used in a large sample to study the behavior of individuals while looking for weight loss information [<xref ref-type="bibr" rid="ref25">25</xref>]. Such a design also has the advantage of tracking various concurrent details, such as the time of day, the season, the geographical location, sociodemographics, anthropometrics, and current mood, to study their association with the search terms. Similarly, case study research can be used to explore this phenomenon because it allows for an in-depth exploration of individual behaviors, contextual influences, and the factors that shape the information-seeking process [<xref ref-type="bibr" rid="ref26">26</xref>]. This approach would help develop a comprehensive understanding of how individuals interact with weight loss information online, including the challenges they face and the strategies they use to navigate the abundance of available online information.</p>
        <p>Third, we used a data-driven and AI-based domain classification approach using Zvelo. Nevertheless, the categories produced by Zvelo were not readily interpretable. There was a broad diversity of website categories and possible overlaps between them (eg, “Nutrition &#38; Diet,” “Health-Low Fat Cooking,” “Food &#38; Drink”). The interpretability of AI-based domain classification should be determined in future studies. Fourth, we manually inspected websites to find the accuracy statements (eg, fact-check statements). These statements were usually in sections like “About Us.” Unfortunately, this method is time-consuming, so future studies can look for a way to automate this task so that all the websites can be examined for accuracy statements. For example, a third-party authenticator can provide a certificate to websites that provide accurate information about weight loss and an API to developers so they can easily access this information.</p>
        <p>Fifth, from the data-mining results, it was clear that sponsored results (ie, advertising), which were not included in the analyses, were assigned the top results in Google searches. Weight loss advertising already has many deceiving pieces of information, with hundreds of cases presented to the Federal Trade Commission⁠ [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. In addition, Google’s online advertising is regulated by algorithms that consider idiosyncratic information about the internet user, such as sociodemographic information, so the ads are better tailored to the user. Future studies could evaluate how this information is displayed to the user, how users interact with it, and how they use it in their everyday lives, particularly in their attempts to lose weight, to evaluate the risks and benefits of interacting with online advertising results. These studies could use an automated approach like the one used in this study.</p>
        <p>Therefore, initiatives should be taken to improve web results so that users can get reliable information about weight loss. For example, a web browser plugin that identifies the top health websites can mark them with an icon so that users can quickly identify them. An example of such a web browser plugin is Web of Trust [<xref ref-type="bibr" rid="ref29">29</xref>], which provides a website reputation rating, and it marks URLs with a green (trusted), yellow (suspicious), red (untrusted), or gray (unknown) icon.</p>
        <p>Furthermore, governments can create policies to ensure websites disclose how they handle misinformation and fact-checking. Websites can also be required to label content that has been fact-checked, along with the source of the fact-check. Weight loss information generated by AI, such as ChatGPT, should also be disclosed. Internet users should look up websites for the “accuracy statements” indicating that the weight loss information is “evidence-based,” “fact-checked,” or at least “reviewed by” to ensure its trustworthiness. Similarly, consumers should inspect whether author credentials are disclosed when weight loss information is provided, such as the name of the person who wrote the information, their profession, academic degrees, and links to further professional information (eg, LinkedIn profile page). Software developers can design algorithms to down-rank or flag potentially misleading content or design web browser plugins to alert users interacting with misinformation.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We developed a data-mining approach to identify and evaluate the top nonadvertising weight loss websites found through Google searches and analyzed 432 search queries. The 5 most frequent websites were healthline.com, webmd.com, verywellfit.com, mayoclinic.org, and womenshealthmag.com. These sites consistently provided fact-checked, evidence-based information with author credentials, indicating high trustworthiness. We also classified websites into various categories using an automated approach and found “Health,” “Personal Pages and Blogs,” “Nutrition and Diet,” and “Exercise” as the most common categories. The findings suggested that while quality information is accessible, users may still encounter less reliable content among various online resources. Therefore, better tools and methods are needed to guide users toward trustworthy weight loss information.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Queries.</p>
        <media xlink:href="infodemiology_v4i1e51701_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 17 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Python code.</p>
        <media xlink:href="infodemiology_v4i1e51701_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 1731 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Results.</p>
        <media xlink:href="infodemiology_v4i1e51701_app3.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 1031 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Categories.</p>
        <media xlink:href="infodemiology_v4i1e51701_app4.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 36 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Google weight loss total count of top 5.</p>
        <media xlink:href="infodemiology_v4i1e51701_app5.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 25 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">IAB</term>
          <def>
            <p>Interactive Advertising Bureau</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This output was supported by the “Systemic Risk Institute” (number LX22NPO5101), funded by the European Union - Next Generation EU (Ministry of Education, Youth and Sports, NPO: EXCELES). The authors declare that generative artificial intelligence was not used in ideation or in the writing of any portion of the manuscript or Python code.</p>
    </ack>
    <notes>
      <title>Data Availability</title>
      <p>The datasets generated during and/or analyzed during this study are available in the Open Science Framework repository [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Amuta</surname>
              <given-names>AO</given-names>
            </name>
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>KC</given-names>
            </name>
          </person-group>
          <article-title>Health information seeking in the digital age: an analysis of health information seeking behavior among US adults</article-title>
          <source>Cogent Soc Sci</source>
          <year>2017</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>1302785</fpage>
          <pub-id pub-id-type="doi">10.1080/23311886.2017.1302785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rideout</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Peebles</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Robb</surname>
              <given-names>MB</given-names>
            </name>
          </person-group>
          <source>Coping with COVID-19: How young people use digital media to manage their mental health</source>
          <access-date>2024-10-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.commonsensemedia.org/sites/default/files/research/report/2021-coping-with-covid19-full-report.pdf">https://www.commonsensemedia.org/sites/default/files/research/report/2021-coping-with-covid19-full-report.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Health online 2013</source>
          <access-date>2021-11-17</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pewinternet.org/2013/01/15/health-online-2013/">http://www.pewinternet.org/2013/01/15/health-online-2013/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Online health search 2006</source>
          <access-date>2021-10-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewresearch.org/internet/2006/10/29/online-health-search-2006/">https://www.pewresearch.org/internet/2006/10/29/online-health-search-2006/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <article-title>Google</article-title>
          <source>Similarweb</source>
          <year>2023</year>
          <access-date>2023-02-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.similarweb.com/website/google.com/">https://www.similarweb.com/website/google.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Modave</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Shokar</surname>
              <given-names>NK</given-names>
            </name>
            <name name-style="western">
              <surname>Peñaranda</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Analysis of the accuracy of weight loss information search engine results on the internet</article-title>
          <source>Am J Public Health</source>
          <year>2014</year>
          <volume>104</volume>
          <issue>10</issue>
          <fpage>1971</fpage>
          <lpage>1978</lpage>
          <pub-id pub-id-type="doi">10.2105/AJPH.2014.302070</pub-id>
          <pub-id pub-id-type="medline">25122030</pub-id>
          <pub-id pub-id-type="pmcid">PMC4167115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cardel</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Chavez</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peñaranda</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Modave</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of weight loss information in Spanish search engine results on the internet</article-title>
          <source>Obesity (Silver Spring)</source>
          <year>2016</year>
          <volume>24</volume>
          <issue>11</issue>
          <fpage>2422</fpage>
          <lpage>2434</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27653438"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/oby.21646</pub-id>
          <pub-id pub-id-type="medline">27653438</pub-id>
          <pub-id pub-id-type="pmcid">PMC5117437</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Elsweiler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Assessing the quality of weight loss information on the German language web</article-title>
          <source>Mov Nutr Heal Dis</source>
          <year>2020</year>
          <volume>3</volume>
          <fpage>39</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.22233/9781910443361-3e.9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Passos</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Vasconcellos-Silva</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Santos</surname>
              <given-names>LADS</given-names>
            </name>
          </person-group>
          <article-title>Cycles of attention to fad diets and internet search trends by Google trends</article-title>
          <source>Cien Saude Colet</source>
          <year>2020</year>
          <volume>25</volume>
          <issue>7</issue>
          <fpage>2615</fpage>
          <lpage>2631</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.scielo.br/scielo.php?script=sci_arttext&#38;pid=S1413-81232020000702615&#38;lng=en&#38;nrm=iso&#38;tlng=en"/>
          </comment>
          <pub-id pub-id-type="doi">10.1590/1413-81232020257.23892018</pub-id>
          <pub-id pub-id-type="medline">32667545</pub-id>
          <pub-id pub-id-type="pii">S1413-81232020000702615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Almenara</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Machackova</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Smahel</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Sociodemographic, attitudinal, and behavioral correlates of using nutrition, weight loss, and fitness websites: an online survey</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <volume>21</volume>
          <issue>4</issue>
          <fpage>e10189</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/4/e10189/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10189</pub-id>
          <pub-id pub-id-type="medline">30946018</pub-id>
          <pub-id pub-id-type="pii">v21i4e10189</pub-id>
          <pub-id pub-id-type="pmcid">PMC6470462</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coogan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sui</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Raubenheimer</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Gluttony and guilt: monthly trends in internet search query data are comparable with national-level energy intake and dieting behavior</article-title>
          <source>Palgrave Commun</source>
          <year>2018</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1057/s41599-017-0055-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madden</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>The seasonal periodicity of healthy contemplations about exercise and weight loss: ecological correlational study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2017</year>
          <volume>3</volume>
          <issue>4</issue>
          <fpage>e92</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2017/4/e92/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.7794</pub-id>
          <pub-id pub-id-type="medline">29237582</pub-id>
          <pub-id pub-id-type="pii">v3i4e92</pub-id>
          <pub-id pub-id-type="pmcid">PMC5745351</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pawar</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Nagpal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pawar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lerman</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Eirin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>General public's information-seeking patterns of topics related to obesity: Google trends analysis</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e20923</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/3/e20923/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/20923</pub-id>
          <pub-id pub-id-type="medline">32633725</pub-id>
          <pub-id pub-id-type="pii">v6i3e20923</pub-id>
          <pub-id pub-id-type="pmcid">PMC7448178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Teng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S-W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Seasonal variation and trends in the Internet searches for losing weight: an infodemiological study</article-title>
          <source>Obes Res Clin Pract</source>
          <year>2020</year>
          <volume>14</volume>
          <issue>3</issue>
          <fpage>225</fpage>
          <lpage>233</lpage>
          <pub-id pub-id-type="doi">10.1016/j.orcp.2020.04.001</pub-id>
          <pub-id pub-id-type="medline">32349915</pub-id>
          <pub-id pub-id-type="pii">S1871-403X(19)30637-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <source>AnswerSocrates</source>
          <year>2023</year>
          <access-date>2021-04-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://answersocrates.com/">https://answersocrates.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Google Trends</collab>
          </person-group>
          <source>Weight loss</source>
          <year>2023</year>
          <access-date>2023-01-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://trends.google.com/trends/explore?date=all&#38;q=weight%20loss&#38;hl=en">https://trends.google.com/trends/explore?date=all&#38;q=weight%20loss&#38;hl=en</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>SerpApi</collab>
          </person-group>
          <source>Google search engine results API</source>
          <year>2021</year>
          <access-date>2021-04-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://serpapi.com/search-api">https://serpapi.com/search-api</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Google</collab>
          </person-group>
          <source>Organic search result</source>
          <year>2023</year>
          <access-date>2023-05-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://support.google.com/google-ads/answer/6054492">https://support.google.com/google-ads/answer/6054492</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vallina</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>PV</given-names>
            </name>
            <name name-style="western">
              <surname>Feal</surname>
              <given-names>Á</given-names>
            </name>
            <name name-style="western">
              <surname>Paraschiv</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gamba</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hohlfeld</surname>
              <given-names>OH</given-names>
            </name>
            <name name-style="western">
              <surname>Tapiador</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vallina-Rodriguez</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Mis-shapes, mistakes, misfits: an analysis of domain classification services</article-title>
          <year>2020</year>
          <conf-name>Proceedings of the ACM Internet Measurement Conference</conf-name>
          <conf-date>2020 October 27-29</conf-date>
          <conf-loc>Virtual Event USA</conf-loc>
          <publisher-loc>New York, NY, United States</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>598</fpage>
          <lpage>618</lpage>
          <pub-id pub-id-type="doi">10.1145/3419394.3423660</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Zvelo</collab>
          </person-group>
          <source>zveloDB™ URL Database</source>
          <year>2023</year>
          <access-date>2023-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zvelo.com/zvelodb-url-database">https://zvelo.com/zvelodb-url-database</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Interactive Advertising Bureau</collab>
          </person-group>
          <source>Content taxonomy</source>
          <year>2023</year>
          <access-date>2023-01-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.iab.com/guidelines/content-taxonomy/">https://www.iab.com/guidelines/content-taxonomy/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>BrightCloud</collab>
          </person-group>
          <source>URL or IP Lookup</source>
          <access-date>2023-01-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.brightcloud.com/tools/url-ip-lookup.php">https://www.brightcloud.com/tools/url-ip-lookup.php</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Zvelo</collab>
          </person-group>
          <source>zveloLIVE: check a URL</source>
          <year>2023</year>
          <access-date>2024-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://tools.zvelo.com">https://tools.zvelo.com</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bada</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nurse</surname>
              <given-names>JRC</given-names>
            </name>
          </person-group>
          <article-title>The social and psychological impact of cyberattacks</article-title>
          <source>Emerging Cyber Threats and Cognitive Vulnerabilities</source>
          <year>2020</year>
          <publisher-loc>Cambridge, Massachusetts</publisher-loc>
          <publisher-name>Academic Press</publisher-name>
          <fpage>73</fpage>
          <lpage>92</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Montag</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Baumeister</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Digital phenotyping and mobile sensing</article-title>
          <source>New Developments in Psychoinformatics</source>
          <year>2022</year>
          <publisher-loc>Berlin, Heidelberg, Dordrecht, and New York City</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>RK</given-names>
            </name>
          </person-group>
          <source>Case study research and applications: Design and methods. 6th ed</source>
          <year>2018</year>
          <publisher-loc>UK</publisher-loc>
          <publisher-name>Sage</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>KB</given-names>
            </name>
          </person-group>
          <source>Consumer fraud in the United States, 2011: The third FTC survey</source>
          <year>2013</year>
          <access-date>2022-03-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ftc.gov/sites/default/files/documents/reports/consumer-fraud-united-states-2011-third-ftc-survey/130419fraudsurvey_0.pdf">https://www.ftc.gov/sites/default/files/documents/reports/consumer-fraud-united-states-2011-third-ftc-survey/130419fraudsurvey_0.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Federal Trade Commission</collab>
          </person-group>
          <source>Gut check: a reference guide for media on spotting false weight loss claims</source>
          <year>2014</year>
          <access-date>2023-02-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ftc.gov/business-guidance/resources/gut-check-reference-guide-media-spotting-false-weight-loss-claims">https://www.ftc.gov/business-guidance/resources/gut-check-reference-guide-media-spotting-false-weight-loss-claims</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <source>Web of Trust</source>
          <year>2023</year>
          <access-date>2023-07-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mywot.com/">https://www.mywot.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Carlos A Almenara</collab>
          </person-group>
          <source>Uncovering the top non-advertising weight loss websites on Google: A data-mining approach</source>
          <access-date>2024-11-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://osf.io/xeajh">https://osf.io/xeajh</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
