<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id><journal-id journal-id-type="publisher-id">infodemiology</journal-id><journal-id journal-id-type="index">38</journal-id><journal-title>JMIR Infodemiology</journal-title><abbrev-journal-title>JMIR Infodemiology</abbrev-journal-title><issn pub-type="epub">2564-1891</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v5i1e66416</article-id><article-id pub-id-type="doi">10.2196/66416</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Assessing the Reliability and Validity of Principles for Health-Related Information on Social Media (PRHISM) for Evaluating Breast Cancer Treatment Videos on YouTube: Instrument Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Kusama</surname><given-names>Hiroki</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Takahashi</surname><given-names>Yoshimitsu</given-names></name><degrees>DrPH</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Orihara</surname><given-names>Shunichiro</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Adachi</surname><given-names>Kayo</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ishizuka</surname><given-names>Yumiko</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Semba</surname><given-names>Ryoko</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shima</surname><given-names>Hidetaka</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Horimoto</surname><given-names>Yoshiya</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kaise</surname><given-names>Hiroshi</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Taguri</surname><given-names>Masataka</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Inoue</surname><given-names>Sho</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Nakayama</surname><given-names>Takeo</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ishikawa</surname><given-names>Takashi</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Breast Surgical Oncology, Tokyo Medical University Hospital</institution><addr-line>6-7-1, Nishishinjuku, Shinjuku-ku</addr-line><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff2"><institution>Department of Implementation Science in Public Health, School of Public Health, Kyoto University</institution><addr-line>Kyoto</addr-line><country>Japan</country></aff><aff id="aff3"><institution>Department of Health Data Science, Tokyo Medical University Hospital</institution><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff4"><institution>Department of Breast Oncology, Faculty of Medicine, Juntendo University</institution><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff5"><institution>Department of Breast Surgery, Douaikai Ozawa Hospital</institution><addr-line>Kanagawa</addr-line><country>Japan</country></aff><aff id="aff6"><institution>Department of Breast Surgical Oncology, Tokyo Medical University Ibaraki Medical Center</institution><addr-line>Ibaraki</addr-line><country>Japan</country></aff><aff id="aff7"><institution>YCU Co-Creation Innovation Center, Yokohama City University</institution><addr-line>Kanagawa</addr-line><country>Japan</country></aff><aff id="aff8"><institution>Department of Health Informatics, School of Public Health, Kyoto University</institution><addr-line>Kyoto</addr-line><country>Japan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mackey</surname><given-names>Tim</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Agbede</surname><given-names>Moses</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Ehtesham</surname><given-names>Zarmina</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Hiroki Kusama, MD, PhD, Department of Breast Surgical Oncology, Tokyo Medical University Hospital, 6-7-1, Nishishinjuku, Shinjuku-ku, Tokyo, 160-0023, Japan, 81 3-3342-6111; <email>kusama.hiroki.8j@tokyo-med.ac.jp</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>11</day><month>6</month><year>2025</year></pub-date><volume>5</volume><elocation-id>e66416</elocation-id><history><date date-type="received"><day>19</day><month>09</month><year>2024</year></date><date date-type="rev-recd"><day>14</day><month>03</month><year>2025</year></date><date date-type="accepted"><day>19</day><month>03</month><year>2025</year></date></history><copyright-statement>&#x00A9; Hiroki Kusama, Yoshimitsu Takahashi, Shunichiro Orihara, Kayo Adachi, Yumiko Ishizuka, Ryoko Semba, Hidetaka Shima, Yoshiya Horimoto, Hiroshi Kaise, Masataka Taguri, Sho Inoue, Takeo Nakayama, Takashi Ishikawa. Originally published in JMIR Infodemiology (<ext-link ext-link-type="uri" xlink:href="https://infodemiology.jmir.org">https://infodemiology.jmir.org</ext-link>), 11.6.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://infodemiology.jmir.org/">https://infodemiology.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2025/1/e66416"/><abstract><sec><title>Background</title><p>There is breast cancer&#x2013;related medical information on social media, but there is no established method for objectively evaluating the quality of this information. Principles for Health-Related Information on Social Media (PRHISM) is a newly developed tool for objectively assessing the quality of health-related information on social media; however, there have been no reports evaluating its reliability and validity.</p></sec><sec><title>Objective</title><p>The purpose of this study was to statistically examine the reliability and validity of PRHISM using videos about breast cancer treatment on YouTube (Google).</p></sec><sec sec-type="methods"><title>Methods</title><p>In total, 60 YouTube videos were selected on January 5, 2024, with the Japanese words for &#x201C;breast cancer,&#x201D; &#x201C;treatment,&#x201D; and &#x201C;chemotherapy,&#x201D; and assessed by 6 Japanese physicians with expertise in breast cancer. These evaluators independently evaluated the videos using PRHISM and an established tool for assessing the quality of health-related information, DISCERN, as well as through subjective assessments. We calculated interrater and intrarater agreement among evaluators with CIs, measuring agreement using weighted Cohen kappa.</p></sec><sec sec-type="results"><title>Results</title><p>The interrater agreement for PRHISM overall quality was &#x03BA;=0.52 (90% CI 0.49-0.55), indicating that the expected level of agreement, statistically defined by the lower limit of the 90% CI exceeding 0.53, was not achieved. However, PRHISM demonstrated higher agreement compared with DISCERN overall quality, which had a &#x03BA;=0.45 (90% CI 0.41-0.48). In terms of validity, the intrarater agreement between PRHISM and subjective assessments by breast experts was &#x03BA;=0.37 (95% CI 0.14-0.60), while DISCERN showed an agreement of &#x03BA;=0.27 (95% CI 0.07-0.48), indicating fair agreement and no significant difference in validity.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>PRHISM has demonstrated sufficient reliability and validity for evaluating the quality of health-related information on YouTube, making it a promising new metric. To further enhance objectivity, it is necessary to explore the use of artificial intelligence and other approaches.</p></sec></abstract><kwd-group><kwd>information quality</kwd><kwd>social media</kwd><kwd>YouTube</kwd><kwd>PRHISM</kwd><kwd>breast cancer treatment</kwd><kwd>videos</kwd><kwd>reliability</kwd><kwd>validity</kwd><kwd>instrument validation study</kwd><kwd>medical information</kwd><kwd>online health information</kwd><kwd>cancer treatment</kwd><kwd>Japan</kwd><kwd>Principles for Health-Related Information on Social Media</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>In recent years, advances in medical technology and diagnostic methods have made health care increasingly complex, leading to a growing tendency for patients to seek information about their disease and treatments [<xref ref-type="bibr" rid="ref1">1</xref>]. Many patients feel anxious during this process, and internet use for collecting medical information is increasing [<xref ref-type="bibr" rid="ref2">2</xref>]. In Japan, about 50% of people use the internet as a method for collecting medical information [<xref ref-type="bibr" rid="ref3">3</xref>]. The sources of information include those officially provided by national cancer centers, as well as those from social media. On social media, anyone can post information regardless of their expertise or qualifications, making it very difficult for patients to judge the quality of that information, which is often a mix of reliable and unreliable sources [<xref ref-type="bibr" rid="ref4">4</xref>]. The spread of misinformation about vaccines during the COVID-19 pandemic highlighted the problem of inaccurate medical information on social media [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. In response to this issue, the National Academy of Medicine (NAM) published a guide in 2021 to help identify reliable sources of health information on social media [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Methods for objectively evaluating the quality of medical information available on the internet have included Diagnostic Information Support Communication Evaluation Report Network (DISCERN) [<xref ref-type="bibr" rid="ref7">7</xref>]. DISCERN was developed as a tool to assess the quality of written information about treatment choices. It is a metric that evaluates the quality of information using 16 questions, consisting of 15 basic assessments and 1 overall assessment, each scored on a 1 (No) to 5 (Yes) Likert scale. This metric has long been considered reliable and is currently used to assess the quality of breast cancer treatment information available on the internet [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. However, since they were developed before the year 2000 and were not designed with social media in mind, there are concerns that they may be inadequate for evaluating social media [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Given the increasing reliance on the internet for health information, it is crucial to ensure that the information available to patients is accurate and reliable. Misinformation can lead to incorrect self-diagnosis, inappropriate treatment choices, and increased anxiety, ultimately affecting patient outcomes and public health. Therefore, there is a pressing need to develop and validate tools specifically designed to evaluate the quality of medical information on social media platforms.</p><p>Denniss and colleagues [<xref ref-type="bibr" rid="ref10">10</xref>] developed the Principles for Health-Related Information on Social Media (PRHISM) tool to evaluate health-related information on social media using a modified Delphi method. This tool assesses 13 principles on a 0 (completely unmet)-4 (completely met) Likert scale and allows nonexperts to evaluate the quality of information, potentially reducing reviewer bias. Compared with existing metrics for evaluating information, PRHISM was specifically designed for social media, offering greater logical validity. Its questions are tailored for social media platforms, with additional considerations for readability and accommodations for vision and hearing impairments. Although PRHISM has not yet been widely used for social media evaluation, its development through appropriate methods and its adaptability suggest it could be valuable for this purpose.</p><p>To address these challenges, we adapted a Japanese version of PRHISM and evaluated its reliability and validity. We also conducted assessments using DISCERN, widely used for evaluating medical information quality, and compared the results with PRHISM. Our goal was to evaluate whether PRHISM could adequately assess information quality on Japanese social media and, using this tool, create an environment where patients can access accurate medical information.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Translation of the PRHISM</title><p>To use PRHISM in Japan, we obtained permission from the developers of PRHISM. First, PRHISM was translated from English to Japanese by a native Japanese speaker (H Kusama). Then, the Japanese version was back-translated into English by a native English speaker. Any discrepancies between the back-translated English version and the original text were identified, and the Japanese version appropriately adjusted (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s2-2"><title>Social Media Platform</title><p>The evaluation of PRHISM was conducted using YouTube (Google). YouTube is the second most used platform in Japan after LINE (LY Corporation) and is used across all age groups [<xref ref-type="bibr" rid="ref11">11</xref>]. Among various platforms, we determined that YouTube is suitable for this evaluation because it allows the posting of longer videos, enabling experts to adequately assess the medical information provided.</p></sec><sec id="s2-3"><title>How to Search</title><p>Since YouTube uses an algorithm that analyzes viewing history through artificial intelligence (AI) to prioritize related videos, searches were conducted using the internet browser Google Chrome in incognito mode, with no login session active. The search terms used were the Japanese words &#x201C;&#x4E73;&#x764C;&#x201D; (&#x306B;&#x3085;&#x3046;&#x304C;&#x3093;, Nyugan, breast cancer), &#x201C;&#x6CBB;&#x7642;&#x201D; (&#x3061;&#x308A;&#x3087;&#x3046;, Tiryou, treatment), and &#x201C;&#x6297;&#x764C;&#x5264;&#x201D; (&#x3053;&#x3046;&#x304C;&#x3093;&#x3056;&#x3044;, Kouganzai, chemotherapy). The search was conducted on January 5, 2024, and the results were sorted by relevance, with the videos listed in order from the top. The exclusion criteria were (1) languages other than Japanese, (2) fewer than 3000 views, (3) shorter than 60 seconds, (4) irrelevant videos, (5) without audio, (6) YouTube shorts, (7) duplicates, and (8) advertisements.</p><p>The sources of the videos were categorized into eight categories: (1) health profession schools and other educational institutions (schools of medicine, pharmacy, etc); (2) health care facilities (hospitals, clinics, etc); (3) nonprofit health plans; (4) public health departments (national statement, regional statement, etc); (5) individual health care professionals (doctors, nurses, occupational therapists, etc); (6) entertainment, media, news; (7) personal blogs; and (8) other.</p><p>These categories were created with reference to the reliable sources identified by the National Academy of Medicine [<xref ref-type="bibr" rid="ref4">4</xref>]. Categories 1&#x2010;4 were defined as content from reliable sources, while categories 5&#x2010;8 were defined as content from other sources. In addition, general information, such as the uploader, number of channel subscribers, number of views, video length, upload date, number of likes, and time since posting, was also collected.</p></sec><sec id="s2-4"><title>Evaluators</title><p>In total, 6 physicians with expertise in breast cancer conducted the evaluations. All of them were surgical oncologists, and the authors recruited participants from their own institution and affiliated hospitals for this study. : KA (8 y as a physician, 1 y as a breast expert), YI (9 y as a physician, 2 y as a breast expert), RS (10 y as a physician, 2 y as a breast expert), HS (16 y as a physician, 7 y as a breast expert), YH (24 y as a physician, 15 y as a breast expert), and H Kaise (37 y as a physician, 20 y as a breast expert).</p></sec><sec id="s2-5"><title>Evaluation Method</title><p>In total, 6 physicians with expertise in breast cancer evaluated a common set of 60 videos. For each video, they used PRHISM and DISCERN for evaluation. In addition, the accuracy and potential harm of the information was assessed.</p></sec><sec id="s2-6"><title>PRHISM</title><p>PRHISM evaluates the quality of health-related information on social media using 13 principles, which are scored on a 0&#x2010;4 Likert scale [<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>Since some items may not be applicable depending on the content of the video, the score is calculated based on the applicable questions and converted to a score out of 100 (PRHISM score). Scores of 100&#x2010;76 are rated as excellent, 75&#x2010;51 as good, 50&#x2010;26 as mediocre, and 25&#x2010;0 as poor (<xref ref-type="other" rid="box1">Textbox 1</xref>).</p><boxed-text id="box1"><title> Summary of the evaluation tools used in this study.</title><p><bold>Principles for Health-Related Information on Social Media (PRHISM)</bold></p><p>PRHISM is comprised of 13 principles. Each principle is scored on a 5-point Likert scale (0-4).</p><p>Principles:</p><list list-type="order"><list-item><p>Authorship</p></list-item><list-item><p>Authoritative</p></list-item><list-item><p>Action-oriented</p></list-item><list-item><p>Financial disclosure</p></list-item><list-item><p>Attribution</p></list-item><list-item><p>Balance and justifiability</p></list-item><list-item><p>Risks and benefits</p></list-item><list-item><p>Privacy</p></list-item><list-item><p>Complementary information</p></list-item><list-item><p>Referrals and support</p></list-item><list-item><p>Readability and comprehensibility</p></list-item><list-item><p>Accessibility</p></list-item><list-item><p>Images</p></list-item></list><p/><p><bold>DISCERN</bold></p><p>DISCERN is comprised of 8 reliability assessments, 7 information quality assessments, and one overall quality assessment. Each principle is scored on a 5-point Likert scale (1-5).</p><p>Reliability:</p><list list-type="order"><list-item><p>Are the aims clear?</p></list-item><list-item><p>Does it achieve its aims?</p></list-item><list-item><p>Is it relevant?</p></list-item><list-item><p>Is it clear what sources of information were used to compile the publication (other than the author or producer)?</p></list-item><list-item><p>Is it clear when the information used or reported in the publication was produced?</p></list-item><list-item><p>How good is the quality of information treatment choices?</p></list-item><list-item><p>Is it balanced and unbiased?</p></list-item><list-item><p>Does it provide details of additional sources of support and information?</p></list-item></list><p>Information quality:</p><list list-type="order"><list-item><p>Does it refer to areas of uncertainty?</p></list-item><list-item><p>Does it describe how each treatment works?</p></list-item><list-item><p>Does it describe the benefits of each treatment?</p></list-item><list-item><p>Does it describe the risks of each treatment?</p></list-item><list-item><p>Does it describe what would happen if no treatment is used?</p></list-item><list-item><p>Does it describe how the treatment choices affect overall quality of life?</p></list-item><list-item><p>Is it clear that there may be more than one possible treatment choice? Does it provide support for shared decision-making?</p></list-item></list><p>Overall evaluation:</p><list list-type="order"><list-item><p>Overall rating of the publications.</p></list-item></list><p/><p/><p><bold>Cancer Expert Assessment Tool</bold></p><p>Cancer expert assessment tool is comprised of 4 question assessments. Two assessments consist of whether the information is true or false and harmful or not harmful, and 2 review reasons why the evaluation was chosen.</p><p>Expert Panel Member Assessment:</p><list list-type="order"><list-item><p>In your opinion, are the primary medical claims within the article accurate?</p><list list-type="bullet"><list-item><p>5: True, 4: Mostly true, 3: Mixture both True/False, 2: Mostly False, 1: False.</p></list-item></list></list-item><list-item><p>If you answered, &#x201C;Mixture both True/False,&#x201D; &#x201C;Mostly False&#x201D; or &#x201C;False,&#x201D; why did you answer this way?</p></list-item><list-item><p>In your opinion, could the primary medical claims within the article cause harm?</p><list list-type="bullet"><list-item><p>5: Certainly NOT Harmful, 4: Probably NOT Harmful, 3: Uncertain, 2: Probably Harmful, 1: Certainly Harmful.</p></list-item></list></list-item><list-item><p>If you answered, &#x201C;Uncertain&#x201D; or &#x201C;Probably Harmful&#x201D; or &#x201C;Certainly Harmful,&#x201D; why did you answer this way?</p></list-item></list></boxed-text></sec><sec id="s2-7"><title>DISCERN</title><p>DISCERN evaluates the scientific reliability of medical information related to treatment descriptions and assigns a score [<xref ref-type="bibr" rid="ref8">8</xref>]. The total score is out of 80 points, with each of the 16 assessments contributing up to 5 points (DISCERN score) (<xref ref-type="other" rid="box1">Textbox 1</xref>).</p></sec><sec id="s2-8"><title>Accuracy and Potential Harm of the Information</title><p>The subjective assessment was conducted using an assessment tool developed by Johnson et al [<xref ref-type="bibr" rid="ref12">12</xref>]. This tool assesses whether the provided medical information is accurate or inaccurate, and if considered inaccurate, the reason is marked in a checkbox. In addition, it evaluates whether the information is harmful or not using the same tool. Accurate information is rated as 1, and inaccurate information as 5, on a Likert scale. Similarly, nonharmful information is rated as 1, and harmful information as 5. To align the scoring methods of PRHISM and DISCERN, in this study, accurate or nonharmful information was rated as 5, and inaccurate or harmful information was rated as 1 (<xref ref-type="other" rid="box1">Textbox 1</xref>).</p></sec><sec id="s2-9"><title>Training and Protocol for Evaluators</title><p>Each evaluator received a lecture once on how to use the metrics during a preliminary meeting. The principal investigator, who is also the first author of the study, conducted the lecture in an internet-based group session in a group session for approximately 60 minutes. Subsequently, evaluation sheets, along with Japanese translations of the PRHISM and DISCERN guides [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], were provided. The evaluators conducted their assessments based on these guides. No further training were conducted thereafter.</p><p>Discussion among evaluators regarding each evaluation was not permitted.</p></sec><sec id="s2-10"><title>Reliability</title><p>Reliability was assessed by examining the agreement of scores between evaluators. In the previous literature on DISCERN, evaluations were based on the agreement of the overall quality score. However, PRHISM does not have a corresponding criterion. For the purpose of statistical evaluation and comparison in this study, we added a &#x201C;PRHISM overall quality&#x201D; component, similar to that in DISCERN, which assessed the entire video after evaluating the 13 principles. This component was also scored on a 0&#x2010;4 Likert scale, and its agreement was evaluated.</p></sec><sec id="s2-11"><title>Validity</title><p>There is no gold standard for evaluating the validity of the quality of medical information. For validity, the subjective assessment of the quality of medical information by physicians with expertise in breast cancer was considered an appropriate assessment, and this was used as the standard for validity. Validity was assessed by examining the agreement between the PRHISM overall quality and the experts&#x2019; subjective assessments. The validity of DISCERN was also examined in the same way.</p></sec><sec id="s2-12"><title>Sample Size Determination</title><p>The number of videos to be evaluated was determined based on the interrater agreement for PRHISM overall quality. As there are no reports examining the level of interrater agreement for PRHISM, DISCERN was used as a reference. Currently, DISCERN is the primary tool used to evaluate the quality of medical information on social media. DISCERN assesses 15 criteria and then evaluates the overall quality of the information. In previous studies, the agreement on the overall quality has been evaluated. Cohen kappa was used to evaluate the degree of agreement. The degree of agreement varies depending on the expertise of the evaluators, with a kappa of 0.23 reported for self-help group members, 0.40 for information providers, and 0.53 for an expert [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>The expected agreement for PRHISM overall quality was assumed to have a threshold of &#x03BA;=0.53 and an expected value of &#x03BA;=0.61. The threshold of 0.53 was determined based on the assumption that PRHISM, being a tool specifically designed for evaluating social media, would achieve a higher level of agreement than DISCERN for an expert. The expected value of 0.61 is generally considered to indicate &#x201C;sufficient agreement&#x201D; in terms of the kappa coefficient [<xref ref-type="bibr" rid="ref14">14</xref>]. For the number of videos to be evaluated in this study, it was necessary to assume the distribution of the overall quality scores in PRHISM. Therefore, as a pilot test, the investigator (HK [Hiroki Kusama]) evaluated 50 videos to establish this distribution in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. Based on the above settings, the number of videos was determined through a simulation experiment conducted 10,000 times. Assuming an alternative hypothesis kappa coefficient of 0.61, the number of videos required to reject the null hypothesis of 0.53 with over 80% power at a 2-sided significance level of 10% was calculated to be 55 for 6 evaluators. The <italic>z</italic> test, approximated by a normal distribution, was used to calculate the test statistics [<xref ref-type="bibr" rid="ref15">15</xref>]. Anticipating that some videos might be difficult to evaluate, we decided to have 6 evaluators assess 60 videos. The 6 evaluators were distributed, with 3 physicians having more than 10 years of experience and 3 physicians having less than 10 years of experience.</p></sec><sec id="s2-13"><title>Statistical Analysis</title><p>The primary analysis focused on examining the interrater agreement for PRHISM overall quality (reliability of PRHISM) and DISCERN overall quality (reliability of DISCERN).</p><p>As secondary analyses, we examined the following:</p><list list-type="bullet"><list-item><p>The intrarater agreement between PRHISM overall quality and DISCERN overall quality.</p></list-item><list-item><p>The intrarater agreement between PRHISM overall quality and expert evaluations (validity of PRHISM).</p></list-item><list-item><p>The intrarater agreement between DISCERN overall quality and expert evaluations (validity of DISCERN).</p></list-item><list-item><p>The interrater agreement for PRHISM score and its categories (reliability of PRHISM).</p></list-item><list-item><p>The interrater agreement for DISCERN score and its categories (reliability of DISCERN).</p></list-item></list><p>To compare the DISCERN score with the PRHISM score, we calculated the modified DISCERN score by subtracting the DISCERN overall quality score from the total DISCERN score, dividing the result by the maximum possible score based on the number of applicable questions, and then converting it to a score out of 100 (modified DISCERN score).</p><p>The agreement of evaluations was assessed using the kappa coefficient. The interpretation of agreement levels is as follows: &#x003C;0.00 (no agreement); 0.00&#x2010;0.20 (slight); 0.21&#x2010;0.40 (fair); 0.41&#x2010;0.60 (moderate); 0.61&#x2010;0.80 (substantial); and 0.81&#x2010;1.00 (almost perfect) [<xref ref-type="bibr" rid="ref14">14</xref>]. The interobserver agreement was calculated using the kappa coefficient and a 90% CI, and an agreement level of 0.61 or higher was interpreted as sufficient.</p><p>For the interrater agreement of the PRHISM overall quality, 2 evaluators were selected from a group of 6, and the agreement for 15 different patterns was calculated. The average and the 90% CI were calculated [<xref ref-type="bibr" rid="ref15">15</xref>]. The 90% CI was calculated using normal approximation. If the lower limit of the 90% CI exceeded 0.53, the primary analysis (PRHISM reliability) was considered to have been achieved.</p><p>For the secondary analyses, the kappa coefficient and its 95% CI were calculated for each pair of evaluators to assess intrarater agreement. Secondary analyses for the interrater agreement were performed using the same approach as the primary analysis.</p><p>In addition, since the PRHISM score and the modified DISCERN score are continuous variables, we also performed an analysis using intraclass correlation coefficient. Statistical analyses were performed using R software (version 4.2.3; R Core Team).</p></sec><sec id="s2-14"><title>Ethical Considerations</title><p>The study was approved by the Institutional Review Board of Tokyo Medical University (T2024-0034). The study involved an analysis of publicly available YouTube data, which does not require individual consent from participants. However, ethical approval was obtained to ensure that the research adhered to institutional guidelines for research involving public data. No compensation was provided to participants as this study involved an analysis of publicly available data. Should any concerns or complaints be raised by video contributors or their families regarding ethical or social issues, the principal investigator will respond sincerely and appropriately in line with institutional procedures.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>Using the predefined search method, we excluded 5 videos in total (1 video with fewer than 3000 views and 4 videos with a duration of less than 1 minute), resulting in a list of 60 videos. A CONSORT (Consolidated Standards of Reporting Trials) diagram is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Flowchart of video selection in this study. In total, 60 videos were selected after excluding those with fewer views or short duration.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e66416_fig01.png"/></fig><p>The median video length was 8 (range: 1&#x2010;126) minutes, the median number of views was 30,542.5 (range: 3921&#x2010;978,676), and the median time since posting was 29 (range: 7&#x2010;123) months. The sources of the videos were as follows: 5 individual health care professionals accounted for the largest category with 15 videos (25%); followed by 6 entertainment, media, and news with 13 videos (22%); 7 personal blogs with 12 videos (20%); 3 nonprofit health plans with 9 videos (15%); 1 health professions schools and other educational institutions with 6 videos (10%); 2 health care organizations with 4 videos (7%); and 8 other sources with 1 video (2%). No videos were posted from the public health departments (<xref ref-type="table" rid="table1">Table 1</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>The characteristics of selected videos on YouTube.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Characteristics</td><td align="left" valign="bottom">Statistical value (n=60)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Video length (mins), median (range)</td><td align="left" valign="top">8 (1-126)</td></tr><tr><td align="left" valign="top" colspan="2">Views, n (range)</td><td align="left" valign="top">30,542.5 (3921-978,676)</td></tr><tr><td align="left" valign="top" colspan="2">Time since posting (months), median (range)</td><td align="left" valign="top">29 (7-123)</td></tr><tr><td align="left" valign="top" colspan="2">Sources of videos, n (%)</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Health professions schools and other educational institutions (eg, medical schools and pharmacy schools)</td><td align="left" valign="top">6 (10)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Health care organizations (eg, academic medical centers and specialty hospitals)</td><td align="left" valign="top">4 (7)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Nonprofit health plans</td><td align="left" valign="top">9 (15)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Public health departments</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Individual health care professionals</td><td align="left" valign="top">15 (25)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Entertainment and media news</td><td align="left" valign="top">13 (22)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Breast cancer survivor&#x2019;s blog</td><td align="left" valign="top">12 (20)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Others</td><td align="left" valign="top">1 (2)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Primary Analysis</title><sec id="s3-2-1"><title>Reliability</title><p>The interrater agreement for PRHISM overall quality was &#x03BA;=0.52 (90% CI 0.49-0.55), indicating moderate agreement. Since the lower limit of the 90% CI was below 0.53, the primary analysis was not achieved. However, the interrater agreement for DISCERN overall quality was &#x03BA;=0.45 (90% CI 0.41-0.48), also indicating moderate agreement. The 90% CI did not overlap, suggesting that PRHISM may be a superior measure in terms of interrater agreement compared with DISCERN (<xref ref-type="fig" rid="figure2">Figures 2</xref> and <xref ref-type="fig" rid="figure3">3</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Interrater agreement on PRHISM and DISCERN overall quality. The circle and triangle represent the mean kappa and CIs (90% CI) are represented by horizontal error bars. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e66416_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Results of reliability and validity agreement. The circle represents the mean kappa and CIs (90 or 95% CI) are represented by horizontal error bars. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; ICC: intraclass correlation coefficients; NaN: not a number; PRHISM: Principles for Health-Related Information on Social Media.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e66416_fig03.png"/></fig></sec><sec id="s3-2-2"><title>Subgroup Analysis in Primary Analysis</title><p>For videos originating from reliable sources (categories 1&#x2010;4), the PRHISM overall quality was &#x03BA;=0.45 (90% CI 0.38-0.51), and the DISCERN overall quality was &#x03BA;=0.28 (90% CI 0.22-0.33). For videos from other sources (categories 5&#x2010;8), the PRHISM overall quality was &#x03BA;=0.40 (90% CI 0.36-0.44), and the DISCERN overall quality was &#x03BA;=0.34 (90% CI 0.30-0.38; <xref ref-type="fig" rid="figure3">Figure 3</xref>, <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The 90% CI for PRHISM from reliable sources did not overlap with the 90% CI for DISCERN.</p><p>For those with over 10 years of experience, the PRHISM overall quality was &#x03BA;=0.57 (90% CI 0.51-0.63), and the DISCERN overall quality was &#x03BA;=0.60 (90% CI 0.54-0.65). For those with less than 10 years of experience, the PRHISM overall quality was &#x03BA;=0.30 (90% CI 0.20-0.40), and the DISCERN overall quality was &#x03BA;=0.21 (90% CI: 0.12-0.29). When the years of experience were 10 or more, the agreement on overall quality was higher for both PRHISM and DISCERN compared with those with less than 10 years of experience (<xref ref-type="fig" rid="figure3">Figure 3</xref>, <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>).</p></sec></sec><sec id="s3-3"><title>Secondary Analysis</title><p>Intrarater agreement for PRHISM overall quality and DISCERN overall quality was &#x03BA;=0.63 (95% CI 0.55-0.73), indicating substantial agreement. In evaluating medical information on social media, there was no significant difference between the assessments of PRHISM overall quality and DISCERN overall quality (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><p>The intrarater agreement among experts was &#x03BA;=0.54 (95% CI 0.50-0.57), indicating moderate agreement (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p></sec><sec id="s3-4"><title>Validity</title><p>We evaluated the agreement between the PRHISM overall quality and DISCERN overall quality scores with the quality of information as subjectively assessed by experts. The agreement between PRHISM overall quality and the experts&#x2019; subjective assessment was &#x03BA;=0.37 (95% CI 0.14-0.60), indicating fair agreement. The agreement between DISCERN overall quality and the experts&#x2019; subjective assessment was &#x03BA;=0.27 (95% CI 0.07-0.48), indicating fair agreement. The 95% CIs overlapped, suggesting that the validity was considered equivalent (<xref ref-type="fig" rid="figure3">Figures 3</xref> and <xref ref-type="fig" rid="figure4">4</xref>). The 95% CIs for the agreement of each of the 6 evaluators all overlapped, but the level of agreement varied among specialists for both PRHISM and DISCERN, ranging from &#x03BA;=0.07 to 0.65 and &#x03BA;=0.01 to 0.51, respectively. (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>).</p><p>The circle represents the mean kappa for PRHISM, and triangle represent the mean kappa for DISCERN. The 95% CIs are represented by horizontal error bars.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Intrarater agreement between PRHISM or DISCERN overall quality and expert opinion, the circle and triangle represent the mean kappa and CIs (95% CI) are represented by horizontal error bars. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e66416_fig04.png"/></fig></sec><sec id="s3-5"><title>Agreement Between PRHISM Score and DISCERN Score</title><p>We evaluated the interrater agreement among 6 evaluators for the PRHISM score and the modified DISCERN score, both rated on a score out of 100. The interrater agreement for the PRHISM score and the modified DISCERN score was &#x03BA;=0.36 (95% CI 0.33-0.40) and &#x03BA;=0.40 (95% CI 0.37-0.43), respectively (<xref ref-type="fig" rid="figure5">Figure 5A</xref>). Using the intraclass correlation coefficient, the PRHISM score was 0.41 (95% CI 0.27-0.55) and the DISCERN score was 0.40 (95% CI 0.24-0.56) (<xref ref-type="fig" rid="figure5">Figure 5B</xref>).</p><p>The circle represents the mean kappa for PRHISM, and the triangle represent the mean kappa for DISCERN. The 95% CIs are represented by horizontal error bars.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Intra-rater agreement between PRHISM score and modified DISCERN score and expert opinion. The circle and triangle represents the mean kappa and 95% CIs are represented by horizontal error bars. (<bold>A</bold>) Cohen kappa. (<bold>B</bold>) Intraclass correlation coefficient. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v5i1e66416_fig05.png"/></fig></sec><sec id="s3-6"><title>Agreement for Each Evaluation Question of PRHISM and DISCERN</title><p>For PRHISM, when a question was judged as &#x201C;not applicable,&#x201D; it was excluded from the score calculation. Therefore, some were assessed using unweighted Cohen kappa. The highest agreement was for question 2, &#x201C;authoritative,&#x201D; with &#x03BA;=0.73 (95% CI 0.70-0.76). For DISCERN, the highest agreement was for item 12, &#x201C;benefits of treatment,&#x201D; with &#x03BA;=0.60 (95% CI 0.56-0.63) (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><p>In addition, PRHISM is a metric that classifies video quality as poor, mediocre, good, or excellent based on the PRHISM score. We evaluated the agreement between the subjective assessments by experts and the PRHISM scoring classification. When assigning 1 to poor and 4 to excellent, the agreement was &#x03BA;=0.54 (95% CI 0.45-0.64), indicating moderate agreement (<xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>).</p></sec><sec id="s3-7"><title>Evaluation of the Quality of Breast Cancer Treatment Information on YouTube in Japan Using PRHISM and DISCERN Score</title><p>Although this study primarily examined the utility of PRHISM, we also evaluated the quality of breast cancer treatment information on YouTube in Japan using PRHISM and DISCERN scores. The mean PRHISM and DISCERN scores for medical information related to breast cancer treatment on Japanese YouTube were 60.6 (SD 11.5) and 58.9 (SD 11.5), respectively (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In evaluating the quality of medical information on YouTube, the interrater agreement for the overall quality score of PRHISM was &#x03BA;=0.52 (90% CI 0.49-0.55), and the primary end point was not achieved. However, the 90% CI for interrater agreement of PRHISM was superior to that of DISCERN, indicating that PRHISM is a more reliable metric when evaluating the quality of medical information on YouTube. In terms of validity, the agreement between the experts&#x2019; subjective assessment and PRHISM overall quality was &#x03BA;=0.37 (95% CI 0.14-0.60), indicating fair agreement. It was found that PRHISM has validity equivalent to that of DISCERN.</p><p>Although the primary end point was not achieved, 1 possible reason was the difficulty in setting the threshold and expected values for interrater agreement of PRHISM. In setting the threshold and expected values, we used DISCERN as a reference because no studies have examined the interrater agreement of PRHISM [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. While the number of evaluators and videos was determined statistically, it is possible that a larger number of both was necessary to adequately evaluate the quality of information. However, DISCERN was designed for books available in public libraries and bookstores, and leaflets produced by professional organizations and national self-help groups. We referred to studies that used DISCERN to evaluate medical information on social media, but many of them used a modified DISCERN with fewer evaluation items, making them difficult to reference [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. DISCERN was not developed for social media, so the agreement may differ from previous studies. In fact, the agreement for DISCERN in this study, which focused on social media, was 0.45, lower than the 0.53 reported in previous studies [<xref ref-type="bibr" rid="ref7">7</xref>] , suggesting that the threshold and expected values might have been better set slightly lower. Therefore, given the results obtained with this threshold, no definitive conclusion can be drawn about the robustness of PRHISM.</p><p>In previous studies, the agreement for DISCERN decreased depending on the profession of the evaluators [<xref ref-type="bibr" rid="ref7">7</xref>]. In this study as well, a difference in agreement was observed depending on whether the years of experience were 10 or more, or less than 10. Although PRHISM is designed to allow for evaluation by nonexperts, these results suggest that evaluations conducted by experts may be more accurate.</p><p>We also examined validity. However, there is no gold standard for evaluating the quality of medical information. Therefore, it is necessary to establish a consensus among experts. During the development of PRHISM, the modified Delphi method, a consensus-building technique, was used. In addition, we assessed validity by setting alternative criteria. In previous reports, some studies have assessed validity based on guidelines and evidence [<xref ref-type="bibr" rid="ref23">23</xref>] , while others have used expert evaluations as the standard [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] . In addition, there are studies that have used DISCERN as an alternative criterion. In this study, using expert evaluations as the standard, the agreement among experts was &#x03BA;=0.54 (95% CI 0.50-0.57), showing a moderate level of consistency. However, the agreement between the experts&#x2019; evaluations and PRHISM overall quality was &#x03BA;=0.37 (95% CI 0.14-0.60), showing only fair agreement. Nevertheless, since the agreement was comparable with that of DISCERN, it suggests that PRHISM is also sufficiently valid for evaluating the quality of information. The lack of strong agreement may be due to the inevitable subjectivity of the assessments, leading to variations in judgments based on each expert&#x2019;s preferences and perspectives. In fact, the level of agreement varied among experts (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). It can be considered to have at least comparable validity to DISCERN, but there may be a need to consider how to use this tool regarding its validity.</p></sec><sec id="s4-2"><title>Future Prospects</title><p>We aim to explore the use of AI to make the evaluation of medical information more objective, efficient, and with higher validity, allowing for the assessment of a larger volume of information in a shorter time. In fact, there are reports investigating whether AI can be used to evaluate online health information [<xref ref-type="bibr" rid="ref25">25</xref>] . This study demonstrated that PRHISM is a suitable tool for evaluating the quality of medical information on social media. Therefore, this research serves as an important first step toward further investigations using PRHISM to assess the quality of medical information in various social media contexts. If low-quality information could automatically trigger warnings, it would help ensure that patients receive higher-quality medical information. Future research will explore the extent to which AI can be integrated into the evaluation process.</p></sec><sec id="s4-3"><title>Limitations</title><p>This study has some limitations. First, the PRHISM overall quality is a metric independently established by the authors and was created specifically for statistical analysis. Since PRHISM is a tool that evaluates information using the PRHISM score or PRHISM scoring classification [<xref ref-type="bibr" rid="ref10">10</xref>], the study may not directly evaluate the tool itself.</p><p>Second, there was a small sample size and a limited number of evaluators. Although a statistically valid number was considered, there was variability in the evaluations among the experts, potentially influenced by differences in their years of clinical experience. This indicates that a larger sample size and a more diverse group of evaluators with varying levels of expertise might be needed. To address this issue, future studies could include standardized training modules to improve consistency. In addition, integrating AI could automate certain aspects of scoring, reducing human bias and increasing efficiency.</p><p>Third, this study presents results solely from Japan. There may be an influence on the results due to biases in breast cancer treatment practices and expertise in Japan, as well as differences in medical environments. In addition, this study was limited to information about breast cancer treatment on YouTube, and the findings may not be applicable to other diseases or health-related information on different social media platforms. Similar studies need to be conducted in other countries and on different social media platforms. Although YouTube has regulations on posted videos, some reports indicate that the quality of health-related videos on YouTube varies widely, from low to high. Therefore, further research is needed to determine whether PRHISM is effective for evaluating content in other countries or on different social media platforms, as this will enhance its utility and relevance globally. We plan to conduct evaluations on other social media platforms.</p></sec><sec id="s4-4"><title>Conclusions</title><p>PRHISM has greater reliability than DISCERN in evaluating the quality of medical information on social media, with comparable validity. It has the potential to become a standard metric for assessing the quality of medical information on social media.</p></sec></sec></body><back><ack><p>We would like to express our sincere gratitude to Denniss for granting us permission to use the PRHISM (Principles for Health-Related Information on Social Media) in this study. We thank Crimson Interactive Pvt Ltd (Ulatus) for their assistance in manuscript translation and editing.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>H Kusama contributed to conceptualization, data curation, formal analysis, investigation, methodology, visualization, and writing &#x2013; original draft. YT contributed to conceptualization, methodology, and writing &#x2013; review and editing. SO contributed to formal analysis. KA, YI, RS, HS, and H Kaise contributed to resources. YH contributed to resources and writing &#x2013; review and editing. MT contributed to formal analysis. SI and TN contributed to conceptualization. TI handled the project administration and writing &#x2013; review and editing.</p></fn><fn fn-type="conflict"><p>YT is employed through a joint research fund between Kyoto University and HealthTech Laboratory Inc. The authors declare that this relationship had no influence on the study design, data collection, analysis, interpretation, or manuscript preparation.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">CONSORT</term><def><p>Consolidated Standards of Reporting Trials</p></def></def-item><def-item><term id="abb3">DISCERN</term><def><p>Diagnostic Information Support Communication Evaluation Report Network</p></def></def-item><def-item><term id="abb4">PRHISM</term><def><p>Principles for Health-Related Information on Social Media</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zeraatkar</surname><given-names>D</given-names> </name><name name-style="western"><surname>Obeda</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ginsberg</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Hirsh</surname><given-names>J</given-names> </name></person-group><article-title>The development and validation of an instrument to measure the quality of health research reports in the lay media</article-title><source>BMC Public Health</source><year>2017</year><month>04</month><day>20</day><volume>17</volume><issue>1</issue><fpage>343</fpage><pub-id pub-id-type="doi">10.1186/s12889-017-4259-y</pub-id><pub-id pub-id-type="medline">28427426</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McMullan</surname><given-names>M</given-names> </name></person-group><article-title>Patients using the internet to obtain health information: how this affects the patient-health professional relationship</article-title><source>Patient Educ Couns</source><year>2006</year><month>10</month><volume>63</volume><issue>1-2</issue><fpage>24</fpage><lpage>28</lpage><pub-id pub-id-type="doi">10.1016/j.pec.2005.10.006</pub-id><pub-id pub-id-type="medline">16406474</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>Telecommunication usage trend survey 2023</article-title><source>Information &#x0026; Communications Statistics Database</source><year>2023</year><access-date>2024-02-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.soumu.go.jp/johotsusintokei/statistics/statistics05.html">https://www.soumu.go.jp/johotsusintokei/statistics/statistics05.html</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kington</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Arnesen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chou</surname><given-names>WYS</given-names> </name><name name-style="western"><surname>Curry</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Lazer</surname><given-names>D</given-names> </name><name name-style="western"><surname>Villarruel</surname><given-names>AM</given-names> </name></person-group><article-title>Identifying credible sources of health information in social media: principles and attributes</article-title><source>NAM Perspect</source><year>2021</year><volume>2021</volume><fpage>34611600</fpage><pub-id pub-id-type="doi">10.31478/202107a</pub-id><pub-id pub-id-type="medline">34611600</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Suarez-Lledo</surname><given-names>V</given-names> </name><name name-style="western"><surname>Alvarez-Galvez</surname><given-names>J</given-names> </name></person-group><article-title>Prevalence of health misinformation on social media: systematic review</article-title><source>J Med Internet Res</source><year>2021</year><month>01</month><day>20</day><volume>23</volume><issue>1</issue><fpage>e17187</fpage><pub-id pub-id-type="doi">10.2196/17187</pub-id><pub-id pub-id-type="medline">33470931</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>KA</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>MP</given-names> </name><etal/></person-group><article-title>Associations between COVID-19 misinformation exposure and belief with COVID-19 knowledge and preventive behaviors: cross-sectional online study</article-title><source>J Med Internet Res</source><year>2020</year><month>11</month><day>13</day><volume>22</volume><issue>11</issue><fpage>e22205</fpage><pub-id pub-id-type="doi">10.2196/22205</pub-id><pub-id pub-id-type="medline">33048825</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charnock</surname><given-names>D</given-names> </name><name name-style="western"><surname>Shepperd</surname><given-names>S</given-names> </name><name name-style="western"><surname>Needham</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gann</surname><given-names>R</given-names> </name></person-group><article-title>DISCERN: an instrument for judging the quality of written consumer health information on treatment choices</article-title><source>J Epidemiol Community Health</source><year>1999</year><month>02</month><volume>53</volume><issue>2</issue><fpage>105</fpage><lpage>111</lpage><pub-id pub-id-type="doi">10.1136/jech.53.2.105</pub-id><pub-id pub-id-type="medline">10396471</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Blackwood</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>FC</given-names> </name><name name-style="western"><surname>Hong</surname><given-names>NJL</given-names> </name><name name-style="western"><surname>Gagliardi</surname><given-names>AR</given-names> </name></person-group><article-title>Quality of DCIS information on the internet: a content analysis</article-title><source>Breast Cancer Res Treat</source><year>2019</year><month>09</month><volume>177</volume><issue>2</issue><fpage>295</fpage><lpage>305</lpage><pub-id pub-id-type="doi">10.1007/s10549-019-05315-8</pub-id><pub-id pub-id-type="medline">31214858</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Iesato</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fushimi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tahara</surname><given-names>R</given-names> </name><etal/></person-group><article-title>A novel system to provide information via online YouTube videos and an evaluation of current online information about hereditary breast cancer</article-title><source>Breast Cancer</source><year>2024</year><month>01</month><volume>31</volume><issue>1</issue><fpage>63</fpage><lpage>74</lpage><pub-id pub-id-type="doi">10.1007/s12282-023-01512-y</pub-id><pub-id pub-id-type="medline">37995024</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Denniss</surname><given-names>E</given-names> </name><name name-style="western"><surname>Lindberg</surname><given-names>R</given-names> </name><name name-style="western"><surname>McNaughton</surname><given-names>SA</given-names> </name></person-group><article-title>Development of principles for health-related information on social media: Delphi study</article-title><source>J Med Internet Res</source><year>2022</year><month>09</month><day>8</day><volume>24</volume><issue>9</issue><fpage>e37337</fpage><pub-id pub-id-type="doi">10.2196/37337</pub-id><pub-id pub-id-type="medline">36074544</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="web"><article-title>Social media stats Japan</article-title><source>Statcounter Global Stats</source><year>2024</year><access-date>2025-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://gs.statcounter.com/social-media-stats/all/japan">https://gs.statcounter.com/social-media-stats/all/japan</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Parsons</surname><given-names>M</given-names> </name><name name-style="western"><surname>Dorff</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Cancer misinformation and harmful information on Facebook and other social media: a brief report</article-title><source>J Natl Cancer Inst</source><year>2022</year><month>07</month><day>11</day><volume>114</volume><issue>7</issue><fpage>1036</fpage><lpage>1039</lpage><pub-id pub-id-type="doi">10.1093/jnci/djab141</pub-id><pub-id pub-id-type="medline">34291289</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Charnock</surname><given-names>D</given-names> </name></person-group><source>The DISCERN Handbook: Quality Criteria for Consumer Health Information on Treatment Choices University of Oxford and The British Library</source><year>1998</year><publisher-name>Radcliffe Medical Press</publisher-name></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Landis</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Koch</surname><given-names>GG</given-names> </name></person-group><article-title>The measurement of observer agreement for categorical data</article-title><source>Biometrics</source><year>1977</year><month>03</month><volume>33</volume><issue>1</issue><fpage>159</fpage><lpage>174</lpage><pub-id pub-id-type="doi">10.2307/2529310</pub-id><pub-id pub-id-type="medline">843571</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Fleiss</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Levin</surname><given-names>B</given-names> </name><name name-style="western"><surname>Paik</surname><given-names>MC</given-names> </name></person-group><source>Statistical Methods for Rates and Proportions</source><year>2003</year><edition>3</edition><publisher-name>John Wiley &#x0026; Sons, Inc</publisher-name><fpage>xxvii</fpage><lpage>760</lpage><pub-id pub-id-type="other">0471526290</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aktas</surname><given-names>BK</given-names> </name><name name-style="western"><surname>Demirel</surname><given-names>D</given-names> </name><name name-style="western"><surname>Celikkaleli</surname><given-names>F</given-names> </name><etal/></person-group><article-title>YouTube as a source of information on prostatitis: a quality and reliability analysis</article-title><source>Int J Impot Res</source><year>2024</year><month>05</month><volume>36</volume><issue>3</issue><fpage>242</fpage><lpage>247</lpage><pub-id pub-id-type="doi">10.1038/s41443-023-00666-9</pub-id><pub-id pub-id-type="medline">36646834</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>&#x00C7;intesun</surname><given-names>FN&#x0130;</given-names> </name><name name-style="western"><surname>&#x00C7;intesun</surname><given-names>E</given-names> </name><name name-style="western"><surname>Se&#x00E7;ilmi&#x015F;</surname><given-names>&#x00D6;</given-names> </name></person-group><article-title>YouTube as a source of information on gonadotropin self-injections</article-title><source>Eur J Obstet Gynecol Reprod Biol</source><year>2021</year><month>09</month><volume>264</volume><issue>135-40</issue><fpage>135</fpage><lpage>140</lpage><pub-id pub-id-type="doi">10.1016/j.ejogrb.2021.07.015</pub-id><pub-id pub-id-type="medline">34303073</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gul</surname><given-names>M</given-names> </name><name name-style="western"><surname>Diri</surname><given-names>MA</given-names> </name></person-group><article-title>YouTube as a source of information about premature ejaculation treatment</article-title><source>J Sex Med</source><year>2019</year><month>11</month><volume>16</volume><issue>11</issue><fpage>1734</fpage><lpage>1740</lpage><pub-id pub-id-type="doi">10.1016/j.jsxm.2019.08.008</pub-id><pub-id pub-id-type="medline">31522984</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khatri</surname><given-names>P</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Belani</surname><given-names>NK</given-names> </name><etal/></person-group><article-title>YouTube as source of information on 2019 novel coronavirus outbreak: a cross sectional study of English and Mandarin content</article-title><source>Travel Med Infect Dis</source><year>2020</year><month>05</month><volume>35</volume><issue>101636</issue><fpage>101636</fpage><pub-id pub-id-type="doi">10.1016/j.tmaid.2020.101636</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kidy</surname><given-names>S</given-names> </name><name name-style="western"><surname>McGoldrick</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Stockton</surname><given-names>P</given-names> </name></person-group><article-title>YouTube as a source of information on extraction of third molars</article-title><source>Oral Maxillofac Surg</source><year>2021</year><month>12</month><volume>25</volume><issue>4</issue><fpage>519</fpage><lpage>524</lpage><pub-id pub-id-type="doi">10.1007/s10006-021-00941-3</pub-id><pub-id pub-id-type="medline">33608797</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martinez</surname><given-names>VH</given-names> </name><name name-style="western"><surname>Ojo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gutierrez-Naranjo</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Proffitt</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hartzler</surname><given-names>RU</given-names> </name></person-group><article-title>The most popular YouTube videos about shoulder replacement are of poor quality for patient education</article-title><source>Arthrosc Sports Med Rehabil</source><year>2023</year><month>06</month><volume>5</volume><issue>3</issue><fpage>e623</fpage><lpage>e628</lpage><pub-id pub-id-type="doi">10.1016/j.asmr.2023.03.001</pub-id><pub-id pub-id-type="medline">37388878</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reddy</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jufas</surname><given-names>N</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>N</given-names> </name></person-group><article-title>Assessing the quality of patient information for cholesteatoma on the video sharing platform YouTube</article-title><source>Otol Neurotol</source><year>2023</year><month>04</month><day>1</day><volume>44</volume><issue>4</issue><fpage>e230</fpage><lpage>e234</lpage><pub-id pub-id-type="doi">10.1097/MAO.0000000000003824</pub-id><pub-id pub-id-type="medline">36706445</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Robillard</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Jun</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Feng</surname><given-names>TL</given-names> </name></person-group><article-title>The QUEST for quality online health information: validation of a short quantitative tool</article-title><source>BMC Med Inform Decis Mak</source><year>2018</year><month>10</month><day>19</day><volume>18</volume><issue>1</issue><fpage>87</fpage><pub-id pub-id-type="doi">10.1186/s12911-018-0668-9</pub-id><pub-id pub-id-type="medline">30340488</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kureyama</surname><given-names>N</given-names> </name><name name-style="western"><surname>Terada</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kusudo</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Fact-checking cancer information on social media in Japan: retrospective study using Twitter</article-title><source>JMIR Form Res</source><year>2023</year><month>09</month><day>6</day><volume>7</volume><fpage>e49452</fpage><pub-id pub-id-type="doi">10.2196/49452</pub-id><pub-id pub-id-type="medline">37672310</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kinkead</surname><given-names>L</given-names> </name><name name-style="western"><surname>Allam</surname><given-names>A</given-names> </name><name name-style="western"><surname>Krauthammer</surname><given-names>M</given-names> </name></person-group><article-title>AutoDiscern: rating the quality of online health information with hierarchical encoder attention-based neural networks</article-title><source>BMC Med Inform Decis Mak</source><year>2020</year><month>06</month><day>9</day><volume>20</volume><issue>1</issue><fpage>104</fpage><pub-id pub-id-type="doi">10.1186/s12911-020-01131-z</pub-id><pub-id pub-id-type="medline">32517759</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>PRHISM English translation. PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app1.docx" xlink:title="DOCX File, 28 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Result of pilot study. The results of an evaluation of the top 50 YouTube videos searched by the representative (H Kusama). The search terms, search method, and exclusion criteria are the same as those used in this study. The y-axis indicates the number of videos, while the x-axis represents the PRHISM overall quality score. PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app2.pptx" xlink:title="PPTX File, 41 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Intrarater agreement between PRHISM/DISCERN overall quality and each expert opinion. The y-axis displays the initials of the breast experts who made the assessments. The circle represents the mean kappa for PRHISM, and the triangle represent the mean kappa for DISCERN. The 95% CIs are represented by horizontal error bars. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app3.pptx" xlink:title="PPTX File, 118 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Subgroup analysis of interrater agreement on PRHISM and DISCERN. The y-axis displays the initials of the breast experts, divided by experience level (over 10 years and 10 years or less). The circle represents the mean kappa for PRHISM, and the triangle represent the mean kappa for DISCERN. The 95% CIs are represented by horizontal error bars. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app4.pptx" xlink:title="PPTX File, 248 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Subgroup analysis of interrater agreement on PRHISM and DISCERN. The y-axis displays the initials of the breast experts, divided by video categories (1&#x2013;4 and 5&#x2013;8). The circle represents the mean kappa for PRHISM, and the triangle represent the mean kappa for DISCERN. The 95% CIs are represented by horizontal error bars. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app5.pptx" xlink:title="PPTX File, 195 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Intrarater agreement between PRHISM score classification and expert opinion. The y-axis displays the initials of the breast experts who made the assessments. The 95% CIs are represented by horizontal error bars. PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app6.pptx" xlink:title="PPTX File, 107 KB"/></supplementary-material><supplementary-material id="app7"><label>Multimedia Appendix 7</label><p>PRHISM and DISCERN Scores for evaluating medical information on Japanese YouTube. Box plots showing the distribution of PRHISM and DISCERN scores for medical information related to breast cancer treatment on Japanese YouTube. The boxes represent the IQR, with the horizontal line indicating the median. The vertical extending lines shows the minimum and maximum values within 1.5 times the IQR. DISCERN: Diagnostic Information Support Communication Evaluation Report Network; PRHISM: Principles for Health-Related Information on Social Media.</p><media xlink:href="infodemiology_v5i1e66416_app7.pptx" xlink:title="PPTX File, 48 KB"/></supplementary-material></app-group></back></article>