<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Infodemiology</journal-id><journal-id journal-id-type="publisher-id">infodemiology</journal-id><journal-id journal-id-type="index">38</journal-id><journal-title>JMIR Infodemiology</journal-title><abbrev-journal-title>JMIR Infodemiology</abbrev-journal-title><issn pub-type="epub">2564-1891</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v6i1e78843</article-id><article-id pub-id-type="doi">10.2196/78843</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Audience-Specific Health Communication: Mixed Methods Evaluation of the Maria Ci&#x00EA;ncia AI-Assisted Knowledge Translation Tool</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Ara&#x00FA;jo-Pereira</surname><given-names>Mariana</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Villalva-Serra Jr</surname><given-names>Klauss</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Pires-Ramos</surname><given-names>Gustavo</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sousa-Peres</surname><given-names>Beatriz</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Concei&#x00E7;&#x00E3;o-Oliveira</surname><given-names>Joan&#x00E3; Nascimento</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Maiche</surname><given-names>Sarah Dourado</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Silva</surname><given-names>Rebeca Rebou&#x00E7;as da Cunha</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Andrade</surname><given-names>Bruno de Bezerril</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Laborat&#x00F3;rio de Pesquisa Cl&#x00ED;nica e Translacional, Instituto Gon&#x00E7;alo Moniz</institution><addr-line>R Waldemar Falc&#x00E3;o 121</addr-line><addr-line>Salvador</addr-line><country>Brazil</country></aff><aff id="aff2"><institution>Universidade Federal da Bahia</institution><addr-line>Salvador</addr-line><country>Brazil</country></aff><aff id="aff3"><institution>Curso de Mestrado de Tecnologias em Sa&#x00FA;de, Escola Bahiana de Medicina e Sa&#x00FA;de P&#x00FA;blica</institution><addr-line>Salvador</addr-line><country>Brazil</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Haupt</surname><given-names>Michael</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Lee</surname><given-names>Seung Won</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Liang</surname><given-names>Xiaolong</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Bruno de Bezerril Andrade, MD, PhD, Laborat&#x00F3;rio de Pesquisa Cl&#x00ED;nica e Translacional, Instituto Gon&#x00E7;alo Moniz, R Waldemar Falc&#x00E3;o 121, Salvador, 40296-710, Brazil, 1 7131762022; <email>brunobezerril@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>3</day><month>3</month><year>2026</year></pub-date><volume>6</volume><elocation-id>e78843</elocation-id><history><date date-type="received"><day>10</day><month>06</month><year>2025</year></date><date date-type="rev-recd"><day>23</day><month>12</month><year>2025</year></date><date date-type="accepted"><day>23</day><month>12</month><year>2025</year></date></history><copyright-statement>&#x00A9; Mariana Ara&#x00FA;jo-Pereira, Klauss Villalva-Serra Jr, Gustavo Pires-Ramos, Beatriz Sousa-Peres, Joan&#x00E3; Nascimento Concei&#x00E7;&#x00E3;o-Oliveira, Sarah Dourado Maiche, Rebeca Rebou&#x00E7;as da Cunha Silva, Bruno de Bezerril Andrade. Originally published in JMIR Infodemiology (<ext-link ext-link-type="uri" xlink:href="https://infodemiology.jmir.org">https://infodemiology.jmir.org</ext-link>), 3.3.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Infodemiology, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://infodemiology.jmir.org/">https://infodemiology.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2026/1/e78843"/><abstract><sec><title>Background</title><p>Scientific misinformation remains a major barrier to effective health communication. Bridging the gap between academic research and public understanding requires tools that simplify scientific language and adapt content to diverse audiences.</p></sec><sec><title>Objective</title><p>This study presents Maria Ci&#x00EA;ncia (LPCT-IGM), a specialized GPT-based assistant for science communication. The tool supports researchers in translating peer-reviewed scientific findings through simple prompts into accessible, ethically appropriate materials tailored for children, the general public, health professionals, and policymakers.</p></sec><sec sec-type="methods"><title>Methods</title><p>The tool was configured using prompt engineering techniques and guided by curated reference materials on inclusive and nonstigmatizing scientific language. Materials derived from 47 public health papers resulted in 188 outputs, which were assessed by 121 evaluators using 4 criteria: clarity, level of detail, language suitability, and content quality. In addition, outputs generated by Maria Ci&#x00EA;ncia were compared with those produced by a base large language model and with human-written science communication materials. Readability and linguistic accessibility were assessed using multiple established metrics.</p></sec><sec sec-type="results"><title>Results</title><p>Worldwide, mean scores were high: clarity (4.90), language suitability (4.78), content quality (4.72), and level of detail (4.56), on a 5-point scale. Materials for children and the general public consistently achieved the highest ratings across all criteria. A targeted comparison with the base large language model demonstrated superior performance of Maria Ci&#x00EA;ncia in contextual stability. Readability analyses indicated that Maria Ci&#x00EA;ncia&#x2019;s outputs were significantly more accessible than human-written texts, while maintaining high legibility classifications.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Maria Ci&#x00EA;ncia demonstrates the potential of artificial intelligence&#x2013;assisted tools to enhance knowledge translation and counter scientific misinformation by producing scalable, audience-specific content that balances accessibility and informational integrity.</p></sec></abstract><kwd-group><kwd>science communication</kwd><kwd>custom GPT</kwd><kwd>public health</kwd><kwd>scientific literacy</kwd><kwd>education</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Scientific misinformation is one of the most pressing challenges of our time, with direct consequences for public trust, the implementation of health policies, and the protection of population health [<xref ref-type="bibr" rid="ref1">1</xref>]. The COVID-19 pandemic sharply illustrated how inaccurate or distorted information can compromise collective responses, with measurable impacts on morbidity and mortality [<xref ref-type="bibr" rid="ref2">2</xref>]. The term &#x201C;infodemic,&#x201D; adopted by the World Health Organization, refers to the overwhelming volume of both accurate and misleading content that undermines access to trustworthy guidance. This phenomenon is amplified by digital platforms and social media, where misinformation spreads faster than corrective content. Efforts to manage infodemics have become a policy priority for global and national institutions, particularly in response to phenomena such as vaccine hesitancy, which has been linked to the resurgence of diseases such as measles.</p><p>Addressing misinformation requires more than reactive fact-checking; it demands the proactive translation of scientific knowledge into accessible, contextually relevant communication. Effective communication must also be timely, audience-centered, and grounded in the social and cultural contexts of the target populations. However, the scientific community itself often struggles to engage effectively with nonspecialist audiences. The persistence of a publication-centered academic culture, combined with time constraints and a lack of training, limits researchers&#x2019; ability to participate in outreach activities [<xref ref-type="bibr" rid="ref3">3</xref>]. While efforts to integrate science communication into academic curricula are increasing, there remains a need for structural support and practical tools to facilitate engagement beyond scholarly environments.</p><p>Recent advances in artificial intelligence (AI) have expanded its application beyond clinical decision support into health communication and knowledge translation. Capability- and function-oriented reviews of AI in health care have highlighted a growing shift toward systems designed to support information delivery, user engagement, and audience adaptation, rather than exclusively diagnostic or predictive tasks. These perspectives emphasize that the value of AI in health increasingly depends on how effectively systems align outputs with user needs, contexts, and levels of expertise. In parallel, research on explainable AI has underscored transparency, interpretability, and usability as central requirements for trust, acceptance, and ethical deployment, particularly in health-related applications [<xref ref-type="bibr" rid="ref4">4</xref>]. Although explainable AI has been extensively discussed in the context of clinical decision support systems, its core principles are equally relevant for health communication tools that aim to produce clear, audience-appropriate, and trustworthy content.</p><p>This paper presents Maria Ci&#x00EA;ncia: an AI-assisted platform designed to translate scientific content into tailored, accessible formats for diverse audiences. Developed using a custom GPT model, the tool supports researchers in generating science communication materials adapted for children, adults with low literacy, health professionals, and decision-makers. Importantly, Maria Ci&#x00EA;ncia is not intended to function as a clinical decision support system, nor to generate diagnostic or therapeutic recommendations. Instead, it operates as an audience-facing knowledge translation tool, focused on mediating peer-reviewed scientific evidence into formats appropriate for different levels of literacy, expertise, and social context.</p><p>The platform was created with the goal of enhancing the reach and impact of health-related scientific information, particularly in contexts where misinformation can influence individual behaviors and public health outcomes. The approach integrates AI with ethical oversight, thematic supervision, and practical communication strategies, aligning with emerging efforts to design responsible, user-centered AI systems for health communication. In contrast to generic chatbot applications, Maria Ci&#x00EA;ncia is grounded in bioethical principles, equity-driven design, and a commitment to cultural and educational inclusivity. By enabling the same scientific input to be transformed into multiple outputs, the platform offers a scalable and adaptable response to the challenges of misinformation and scientific inaccessibility in public health and beyond.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>This study presents the development and evaluation of Maria Ci&#x00EA;ncia, an AI-powered assistant designed to translate peer-reviewed research into audience-specific communication products. The tool was developed with the objective of promoting inclusive, accurate, and culturally sensitive dissemination of scientific knowledge, particularly in the field of public health. The methodological approach combined AI-supported content generation, audience-specific language adaptation, and empirical evaluation based on stakeholder feedback.</p></sec><sec id="s2-2"><title>Creation and Structure of the Tool</title><p>Maria Ci&#x00EA;ncia was developed on the ChatGPT Plus (OpenAI) platform, a commercial version of ChatGPT (OpenAI) that allows for the creation of customized GPTs (also known as AI assistants) through detailed configuration of instructions, role definitions, and operational parameters. The primary function of Maria Ci&#x00EA;ncia is to enable researchers to input scientific materials, such as peer-reviewed papers, and select the intended target audience. Based on this input, the assistant generates adapted communication materials suitable for various reader profiles, including children, the general population, health professionals, and policy decision-makers. These outputs are designed to be practical for use in educational, clinical, and public outreach contexts. ChatGPT is an AI-generated content developed by OpenAI that uses a transformer decoder-only architecture. The GPT model used in this approach was ChatGPT 4.5, released in February 2025. This version stands out as one of the most current versions alongside the ChatGPT o4-mini version, achieving in accuracy tests a 62.5% correctness rate, the highest value in software quality tests among the versions, and the lowest hallucination rate at 37.1%.</p></sec><sec id="s2-3"><title>Prompt Configuration and Operational Guidelines</title><p>The Maria Ci&#x00EA;ncia assistant was configured through prompt engineering techniques combined with a carefully curated set of reference documents that established linguistic, ethical, and stylistic parameters. This configuration aimed to guide the assistant in generating respectful, inclusive, and audience-appropriate outputs. Training the AI assistant with carefully selected documentation greatly improves the accuracy and relevance of its responses [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. In this study, we used reference materials on scientific dissemination, inclusive languages, and health dictionaries to fine-tune the model. Of note, the tool was initially tested in Brazilian Portuguese.</p><p>The assistant was assigned the explicit role of a Specialized Science Communicator, with advanced knowledge in public health, immunology, infectious and chronic diseases, and health communication. Its core objective was to translate complex scientific knowledge into formats that could be readily understood by diverse audiences. The interaction protocol included three primary steps: (1) understanding user needs: prompting users to specify the target audience (children, general public, health students, or health managers), (2) continuous engagement: encouraging deeper interaction through follow-up questions, and (3) final content generation: producing the final adapted text aligned with the audience&#x2019;s profile.</p><p>Content adaptation guidelines were explicitly defined for each audience segment: (1) children: playful and narrative-driven writing inspired by Writing for Young Minds, incorporating contextual summaries and storytelling techniques; (2) general public: simplification of scientific concepts with actionable health information, drawing from accessible Brazilian sources such as Superinteressante and Profiss&#x00E3;o Biotec; (3) health students: simplified explanations while maintaining technical terminology, with emphasis on key health concepts; and (4) health professionals and managers: structured summaries including population characteristics, methodological overviews, and actionable public health recommendations (typically 5 suggested policy improvements).</p><p>Additionally, for social media content, the assistant adapted outputs for platforms such as Instagram (Meta) and LinkedIn, ensuring appropriate tone, hashtags, and visual alignment for each context.</p></sec><sec id="s2-4"><title>Training Materials</title><p>Among the sources used were the &#x201C;Na ponta das l&#x00ED;nguas: pequeno gloss&#x00E1;rio para apoiar o enfrentamento do estigma e da discrimina&#x00E7;&#x00E3;o,&#x201D; carried out with the support of the Brazilian Ministry of Health, which offers terminology to reduce stigma in health communication [<xref ref-type="bibr" rid="ref7">7</xref>], as well as the &#x201C;UNAIDS Terminology Guidelines&#x201D; [<xref ref-type="bibr" rid="ref8">8</xref>], which provide recommendations for respectful and accurate language related to HIV and global health. The &#x201C;Global TB Dictionary&#x201D; was used to ensure technical accuracy in tuberculosis-related content, and also the &#x201C;UNICEF Terminology Dictionary&#x201D; for the protection of children regarding matters of a sexual nature [<xref ref-type="bibr" rid="ref9">9</xref>]. To support outputs for younger audiences, the tool&#x2019;s language was informed by resources such as &#x201C;Writing for Young Minds&#x201D; and adapted scientific texts such as those published in Frontiers for Young Minds [<xref ref-type="bibr" rid="ref10">10</xref>]. Additional materials, including guides to science communication [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>] and examples of accessible writing from Brazilian science outreach initiatives such as &#x201C;Profiss&#x00E3;o Biotec&#x201D; [<xref ref-type="bibr" rid="ref13">13</xref>], were used to calibrate tone, clarity, and structure across all outputs.</p><p>The training process emphasized the use of nonstigmatizing and inclusive language, minimization of unnecessary technical jargon, clear structuring of information according to literacy level, and contextual sensitivity to cultural and ethical dimensions of health communication. An additional focus was placed on ensuring equitable representation and fairness in responses across diverse population groups, particularly those historically marginalized in public health communication. The outputs generated by Maria Ci&#x00EA;ncia included short narratives and analogies for children, simplified papers for the general population, technical summaries for health professionals, strategic briefs for health managers, and communication materials designed for social media. Additionally, Maria Ci&#x00EA;ncia includes, in its presentation on the question bar, preconfigured prompts for users with guiding questions for using the chatbot, such as &#x201C;translate this article for the general public,&#x201D; &#x201C;how to explain this concept to children,&#x201D; or &#x201C;create an accessible summary for children.&#x201D; Finally, the assistant was programmed to provide appropriate attribution for all generated materials, including the original scientific source, first author, journal, and year of publication.</p></sec><sec id="s2-5"><title>Generation of Outputs for Evaluation</title><p>Following the configuration of the assistant, we selected 47 peer-reviewed papers (on public health, infectious diseases, and epidemiology) from our institution to serve as the training material. This approach provided the opportunity to invite the original authors of these papers to participate as evaluators in the assessment team. To minimize potential evaluation bias, the chatbot outputs for each paper were generated by external collaborators who were not part of the research group and who did not have a scientific background. Using only the preconfigured guiding questions in the chatbot interface, these collaborators generated 4 outputs per paper, including &#x201C;for children,&#x201D; &#x201C;for health managers,&#x201D; &#x201C;for social media,&#x201D; and &#x201C;for the general public,&#x201D; resulting in a total of 188 outputs. All outputs were generated using a dedicated user account created exclusively for this purpose, to minimize potential bias from prior sessions or unrelated model interactions.</p></sec><sec id="s2-6"><title>Public Evaluation of Chatbot Outputs</title><p>Following the generation of 188 outputs (4 per paper across 47 selected papers), a public evaluation process was conducted to assess the quality and appropriateness of the content produced by Maria Ci&#x00EA;ncia. A standardized online evaluation form was developed for this purpose, structured to allow systematic feedback from diverse audiences. The evaluation process engaged 5 stakeholder groups: authors of the original papers, health professionals and students, social media specialists, members of the general public, and health managers. The evaluation form was disseminated through social media channels to reach a broad and heterogeneous audience. In addition, the original authors of the selected papers were invited to participate in the evaluation. This dual approach enabled the inclusion of both expert and lay perspectives in the assessment process. Participation was voluntary and anonymous.</p><p>Of note, evaluators were allowed to assess materials not exclusively targeted to their own audience profile to capture broader perceptions of clarity, tone, and appropriateness, reflecting real-world dissemination contexts in which health communication materials are often encountered by diverse audiences. In addition, children were not recruited as evaluators in this study, given that research involving minors requires parental permission and age-appropriate assent procedures. Given the exploratory nature of this evaluation and the absence of a child-centered protocol, the assessment of child-focused materials relied on adult evaluators.</p><p>Each participant was asked to assess selected chatbot outputs according to the following criteria: (1) Clarity: Is the text clear and appropriate for the intended audience? (2) Detail: Does the text provide sufficient and relevant information? (3) Language suitability: Is the language appropriate for the literacy level and context of the intended audience? (4) Content quality: Does the text maintain scientific accuracy and communicative effectiveness?</p><p>Participants assigned scores on a scale from 1 (poor) to 5 (excellent) for each criterion. Additionally, the form included an open field for qualitative comments, enabling participants to provide contextual feedback on strengths, limitations, or suggestions for improvement. Qualitative feedback provided by anonymous evaluators was analyzed using thematic categorization. Comments were grouped into four predefined domains: (1) language (clarity, accessibility, and appropriateness of language use); (2) information (accuracy, level of detail, and appropriateness of content for the audience); (3) structure (organization, narrative flow, and format of the material); and (4) proposal (whether the material complied with the intended purpose and target audience). For each domain, comments were further classified as either criticism or praise (for language, information, and structure), or as complies with proposal or does not comply with proposal (for proposal). Each comment was reviewed independently and could be assigned to multiple categories when it addressed more than one thematic domain.</p></sec><sec id="s2-7"><title>Accuracy Evaluation and Comparison With Base GPT</title><p>In addition to the public evaluation of the outputs, a focused accuracy evaluation was conducted to compare the performance of Maria Ci&#x00EA;ncia with that of the base GPT-4.5 (OpenAI) model. This comparison aimed to assess whether the custom configuration of Maria Ci&#x00EA;ncia, which incorporates training on inclusive, nonstigmatizing, and health-appropriate language, enhanced the model&#x2019;s ability to maintain contextual relevance and communicative precision in public health content generation. For this purpose, a selected set of questions previously answered by Maria Ci&#x00EA;ncia was resubmitted to both Maria Ci&#x00EA;ncia and the base GPT-4.5 (without the custom configuration) separately.</p><p>To minimize potential bias from session memory, priming, or model adaptation effects, the evaluations for Maria Ci&#x00EA;ncia and base GPT-4.5 were conducted using separate user accounts. This ensured that the comparative responses were generated independently, reducing the risk of inadvertent learning from previous interactions within the same account. In addition, to assess response stability, the same questions were submitted multiple times in different conversational sequences, allowing us to evaluate whether the models maintained contextual coherence across repeated interactions.</p><p>Responses from both models were evaluated by a team composed of health care professionals and undergraduate students. The evaluation criteria included 4 key dimensions: whether the response accurately established the context of the question; whether contextual coherence was preserved throughout the conversation; whether there was any interruption or drift from the intended context; and, if such drift occurred, whether the model was able to recover and return to the appropriate context. Each dimension was scored on a qualitative scale from 1 (poor) to 5 (excellent). The comparative analysis of results aimed to determine whether Maria Ci&#x00EA;ncia&#x2019;s configuration effectively enhanced contextual accuracy and stability, thus supporting its suitability for reliable and ethically appropriate use in public health communication. The following four dimensions were used to structure the assessment: (1) Establishment of a context: Does the answer fulfill the objective of the question according to the inserted context? (2) Continuity of conversation without specific context of the question: Do the following answers in the conversation with the chatbot lose the context in relation to the question? (3) Interruption of context: Do the answers interrupt or stop fulfilling the context of the question? (4) Return to context: Even after the interruption of the context or digression, is the chatbot able to return to the context of the question?</p><p>The tool operates in various languages, having been tested by the developers at Maria Ci&#x00EA;ncia in Portuguese, English, Spanish, Italian, and French. Moreover, as it is a GPT assistant, the platform supports more than 50 languages [<xref ref-type="bibr" rid="ref14">14</xref>]. Regardless of the language, the generated content follows the same principles of technical configuration, linguistic curation, and thematic supervision. This version preserves the commitment to accessibility, scientific accuracy, and ethical adequacy in knowledge translation, with a view toward application in international and multilingual contexts.</p></sec><sec id="s2-8"><title>Comparative and Readability Analyses</title><p>We conducted additional analysis, including human-written science communication materials and outputs generated by a nonspecialized base GPT-4.5. First, we performed an active search for human-authored news papers and popular science texts related to the peer-reviewed papers previously included in the main evaluation. This search yielded human-written communication materials corresponding to 5 of the originally analyzed scientific papers, all published in open-access media outlets.</p><p>In addition, to include recent and independent examples, we searched Google News (on December 1, 2025) using the query &#x201C;new study in infectious diseases.&#x201D; From the results, we selected the first five news reports that met the following criteria: (1) publication in non&#x2013;university-affiliated media outlets, (2) reference to peer-reviewed scientific papers, and (3) availability of the original scientific papers under open-access conditions.</p><p>For these five additional papers, audience-oriented texts were generated using both Maria Ci&#x00EA;ncia and the base GPT-4.5 model. The same simple prompt was applied to the base model across all cases (&#x201C;transform this article into a text for the general population&#x201D;), allowing a direct comparison between specialized and nonspecialized large language model outputs.</p><p>All materials (Maria Ci&#x00EA;ncia outputs, base GPT-4.5 outputs, and human-written texts) were subjected to a standardized textual readability analysis. This analysis was applied to texts generated for all target audiences and encompassed both the original evaluation set and the additional comparative corpus. Readability metrics included: Flesch reading ease, Gulpease index, Flesch-Kincaid grade level, adapted Gunning fog index, automated readability index (ARI), Coleman-Liau index, letter-to-word ratio, syllable-to-word ratio, words-per-sentence ratio, and proportion of complex words. All readability analyses were conducted using the ALT (analysis of language and text) software, a tool specifically developed for Portuguese-language texts, as described by Moreno et al [<xref ref-type="bibr" rid="ref15">15</xref>] (2023). This approach enabled a quantitative and language-appropriate comparison of textual complexity across human-written materials and AI-generated outputs, independently of subjective evaluator impressions.</p></sec><sec id="s2-9"><title>Data Analysis</title><p>Quantitative data from the evaluation forms were analyzed using descriptive statistics. For each evaluation criterion, means and SDs were calculated. Frequencies and percentages were computed for the classification of evaluator identities and for the distribution of outputs across target audiences. All analyses were conducted using the structured database generated from the stakeholder evaluations. For comparative purposes, we compared each readability metric according to the text generator (Maria Ci&#x00EA;ncia, base GPT-4.5, or human-written).</p></sec><sec id="s2-10"><title>Ethical Considerations</title><p>This study was conducted as a public opinion survey evaluating AI-generated science communication materials. All data were collected through voluntary and anonymous participation, without the collection of identifiable or sensitive personal information, and without any form of intervention or risk to participants. In line with international ethical standards and in accordance with Brazilian Resolution CNS 510/2016, which exempts public opinion research involving nonidentified participants from requiring formal ethics committee approval, this study did not require submission to a research ethics committee.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>Before launching the public evaluation, we first analyzed the process of generating the 188 outputs used for assessment. The generation was conducted by external collaborators with no scientific background, using a dedicated user account created exclusively for this purpose. During this process, important differences were observed between the use of the free version and the paid version (ChatGPT Plus). In the free version, the model frequently (10%) exhibited technical limitations: it would often require questions to be reformulated and occasionally produce incomplete outputs. The average generation time per output in this version was approximately 15.2 (SD 2.3) seconds. After upgrading to the ChatGPT Plus version, performance improved in measurable operational terms. The model produced responses more rapidly and with greater consistency, showing a more direct communication style. In this version, the mean generation time decreased to 8.5 (SD 1.5) seconds, and the incidence of incomplete outputs was eliminated. Despite these differences, the free version remained capable of generating the requested outputs using the predefined prompts provided by Maria Ci&#x00EA;ncia; however, it required longer processing time and occasional manual resubmission of prompts to ensure complete responses.</p></sec><sec id="s3-2"><title>Evaluator Profile and Distribution of Reviewed Outputs</title><p>The evaluation of Maria Ci&#x00EA;ncia involved 121 responses to the form, stratified across 5 distinct groups, each representing a key target audience of the tool. The distribution of respondents was as follows: health professionals and students (56/121, 44.6%), original authors of the scientific papers (33/121, 27.3%), members of the general population (26/121, 21.5%), communication specialists (4/121, 3.3%), and health managers (4/121, 3.3%; <xref ref-type="fig" rid="figure1">Figure 1</xref>). Each evaluator assessed outputs generated for one or more specific target audiences, including &#x201C;for children&#x201D; (n=27), &#x201C;for health managers&#x201D; (n=35), &#x201C;for social media&#x201D; (n=24), and &#x201C;for the general public&#x201D; (n=35). Among these groups, only the original paper authors had prior in-depth knowledge of the scientific content being communicated. Notably, <xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the distribution of reviewed text types according to identity profile classification, revealing clear patterns in how different stakeholder groups engaged with the audience&#x2010;adapted outputs. Communication professionals and health managers exclusively reviewed solely the texts targeted at their respective profiles (100%), while the other evaluator profiles diversified their reviewed texts. Given the small proportion of the evaluator sample, results related to these subgroups were reported descriptively and were interpreted as exploratory.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Donut charts summarizing the types of audience-adapted texts proportionally reviewed by each participant identity classification. Segment colors represent the percentage of texts tailored for different audiences, including (1) for social media (lavender), (2) for health managers (golden), (3) for children (gray), and (4) for the general public (green). Each donut reflects the distribution of text types reviewed by participants within a specific identity group.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v6i1e78843_fig01.png"/></fig><p>Among the general population evaluators, 62% (16/26) assessed the &#x201C;for the general public&#x201D; texts, while 23% (6/26) provided feedback on &#x201C;for children&#x201D; versions, and 15% (4/26) on &#x201C;for health managers.&#x201D; Notably, none of the general population participants reviewed the &#x201C;for social media&#x201D; outputs. Health professionals and students provided a broader distribution of feedback, with 44% (24/56) evaluating &#x201C;for health managers&#x201D; outputs, 25% (14/56) &#x201C;for the general public,&#x201D; 20% (11/56) &#x201C;for children,&#x201D; and 9% (5/56) &#x201C;for social media.&#x201D; Finally, the paper authors demonstrated a balanced engagement across all 4 categories: 33% (11/33) reviewed &#x201C;for the general public&#x201D; outputs, 30% (10/33) &#x201C;for children,&#x201D; 21% (7/33) &#x201C;for health managers,&#x201D; and 15% (5/33) &#x201C;for social media&#x201D; (<xref ref-type="fig" rid="figure1">Figure 1</xref>). The distribution of respondents and their evaluation profiles across different target audiences is summarized in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Distribution of reviewer identities and rating frequencies by target audience. This table displays the frequency (n) and percentage (%) of reviewers&#x2019; self&#x2010;reported identity classifications and rating scores across 4 different domains, stratified by the number of reviews attributed to each target audience texts. <italic>P</italic> values were calculated using Fisher exact test (for nominal categorical counts) or Kruskal-Wallis tests (for ordinal rating distributions), comparing across the 4 target&#x2010;audience groups. A <italic>P</italic> value &#x003C;.05 denotes a statistically significant difference among audiences.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">For children (n=27)</td><td align="left" valign="bottom">For health managers (n=35)</td><td align="left" valign="bottom">For social media (n=24)</td><td align="left" valign="bottom">For the general public (n=35)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Variable</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Participant classification, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Paper author</td><td align="left" valign="top">10 (37)</td><td align="left" valign="top">7 (20)</td><td align="left" valign="top">11 (45.8)</td><td align="left" valign="top">5 (14.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Communication professional</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">4 (16.7)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;General population (18+ years)</td><td align="left" valign="top">6 (22.2)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">4 (16.7)</td><td align="left" valign="top">16 (45.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Health manager</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">4 (11.4)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Health student or professional</td><td align="left" valign="top">11 (40.7)</td><td align="left" valign="top">24 (68.6)</td><td align="left" valign="top">5 (20.8)</td><td align="left" valign="top">14 (40)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="6">Rating</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Clarity, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.21</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;2</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;3</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">2 (5.7)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;4</td><td align="left" valign="top">4 (14.8)</td><td align="left" valign="top">6 (17.1)</td><td align="left" valign="top">4 (16.7)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;5</td><td align="left" valign="top">23 (85.2)</td><td align="left" valign="top">26 (74.3)</td><td align="left" valign="top">20 (83.3)</td><td align="left" valign="top">34 (97.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Detailing, n (<bold>%</bold>)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.28</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;2</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;3</td><td align="left" valign="top">2 (7.4)</td><td align="left" valign="top">8 (22.9)</td><td align="left" valign="top">4 (16.7)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;4</td><td align="left" valign="top">6 (22.2)</td><td align="left" valign="top">7 (20)</td><td align="left" valign="top">6 (25)</td><td align="left" valign="top">5 (14.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;5</td><td align="left" valign="top">19 (70.4)</td><td align="left" valign="top">19 (54.3)</td><td align="left" valign="top">14 (58.3)</td><td align="left" valign="top">28 (80)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Language adequacy, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.20</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;2</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;3</td><td align="left" valign="top">3 (11.1)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top">2 (8.3)</td><td align="left" valign="top">1 (2.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;4</td><td align="left" valign="top">4 (14.8)</td><td align="left" valign="top">12 (34.3)</td><td align="left" valign="top">2 (8.3)</td><td align="left" valign="top">6 (17.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;5</td><td align="left" valign="top">20 (74.1)</td><td align="left" valign="top">21 (60)</td><td align="left" valign="top">20 (83.3)</td><td align="left" valign="top">28 (80)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Content quality, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.11</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;2</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;3</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">4 (11.4)</td><td align="left" valign="top">1 (4.2)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;4</td><td align="left" valign="top">7 (25.9)</td><td align="left" valign="top">12 (34.3)</td><td align="left" valign="top">7 (29.2)</td><td align="left" valign="top">7 (20)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;&#x2003;5</td><td align="left" valign="top">20 (74.1)</td><td align="left" valign="top">19 (54.3)</td><td align="left" valign="top">16 (66.7)</td><td align="left" valign="top">28 (80)</td><td align="left" valign="top">&#x2003;</td></tr></tbody></table></table-wrap></sec><sec id="s3-3"><title>Public Evaluation of Audience-Adapted Outputs</title><p>Each output was independently evaluated by respondents from multiple stakeholder groups, using 4 evaluation criteria: clarity of the text, level of detail, suitability of language for the intended audience, and overall content quality. Participants rated each criterion on a 5-point scale, with 5 indicating strong agreement regarding the quality or appropriateness of the item assessed. The distribution of evaluator profiles and scoring frequencies is presented in <xref ref-type="table" rid="table1">Table 1</xref>.</p><p>Within this exploratory evaluation, the adapted texts were rated highly across all criteria (<xref ref-type="table" rid="table1">Table 1</xref>). Texts targeting the general public received strong evaluations. Among members of this audience, mean scores were 4.94 (SD 0.25) for clarity, 4.56 (SD 0.89) for detail, 4.62 (SD 0.62) for language suitability, and 4.75 (SD 0.45) for overall quality. Students and health professionals were equally enthusiastic, with scores of 5.00 (SD 0.00) for clarity, 4.86 (SD 0.36) for detailing, 4.93 (SD 0.27) for language, and 4.93 (SD 0.27) for quality. Of note, researchers who authored the original papers were somewhat more critical, assigning 5.00 (SD 0.00) for clarity, 4.80 (SD 0.45) for detail, 4.80 (SD 0.45) for language, and 4.60 (SD 0.55) for overall quality (<xref ref-type="table" rid="table2">Table 2</xref>).</p><p>Similarly, the child-focused outputs were well received. The general public assigned near-perfect ratings of 5.00 (SD 0.00) for clarity, 4.83 (SD 0.41) for detail, 4.83 (SD 0.41) for language suitability, and 4.83 (SD 0.41) for content quality. Students and health professionals also rated the child-focused content highly, with a means of 4.82 (SD 0.40) for clarity, 4.64 (SD 0.67) for detailing, 4.73 (SD 0.65) on language suitability, and 4.73 (SD 0.47) regarding overall quality. Again, the original authors were more reserved, assigning 4.80 (SD 0.42) for clarity, 4.50 (SD 0.71) for detail, 4.40 (SD 0.84) for language, and 4.70 (SD 0.48) for overall quality (<xref ref-type="table" rid="table2">Table 2</xref>).</p><p>Next, the version tailored for health managers was rated lower by managers themselves, who rated it 4.00 (SD 1.41) for clarity, 4.00 (SD 1.41) for detail, 4.00 (SD 0.82) for language suitability, and 4.25 (SD 0.96) for content quality. Students and health professionals provided comparably high scores, with 4.83 (SD 0.48) for clarity, 4.58 (SD 0.72) for detail, 4.62 (SD 0.71) for language suitability, and 4.67 (SD 0.56) for overall quality. Original paper authors again expressed greater variability in their evaluations, especially regarding level of detail, with a mean of 3.29 (SD 0.49), similarly lower ratings were reported for clarity, which was 4.29 (SD 0.76), 4.43 (SD 0.53) for language, and 3.71 (SD 0.49) for content quality (<xref ref-type="table" rid="table2">Table 2</xref>).</p><p>For evaluations aimed at social media texts, all evaluators rated these texts highly. General public reviewers rated this version at 5.00 (SD 0.00) for clarity, 4.75 (SD 0.50) for detail, 4.50 (SD 1.00) for language suitability, and 4.50 (SD 1.00) for overall quality. Students and health professionals similarly gave high scores, 5.00 (SD 0.00) for clarity, 4.40 (SD 0.89) for detail, 4.80 (SD 0.45) for language suitability, and 4.60 (SD 0.55) for content quality. Communication professionals assigned a perfect mean score of 5.00 (SD 0.00) across all 4 criteria. As observed for other target audiences, paper authors provided more conservative ratings, with scores of 4.64 (SD 0.50) for clarity, 4.09 (SD 0.83) for detail, 4.73 (SD 0.65) for language suitability, and 4.55 (SD 0.52) for overall quality (<xref ref-type="table" rid="table2">Table 2</xref>).</p><p>Taken together, within this exploratory evaluation, audience-adapted texts received high mean scores across all 4 assessed criteria, regardless of the target audience. Notably, texts adapted for children and for the general population received particularly high ratings across all dimensions, with most mean scores approaching the maximum value of 5. Health students or professionals, communication professionals, and the general adult population tended to assign higher scores overall, while health managers and paper authors demonstrated greater variability in their assessments, especially for detailing of texts targeting health managers or social media platforms (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Among all groups, paper authors exhibited the greatest variability in their evaluations. These patterns indicate broad perceived acceptability of the materials in this sample, with subtle differences in perceived quality depending on the evaluator profile (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Mean evaluation scores of audience-adapted texts by criterion and evaluator population. Bubble plot presenting the mean scores for each evaluation criterion, clarity, detailing, language adequacy, and content quality, across four types of audience-adapted texts: (A) for children, (B) for the general population, (C) for health managers, and (D) for social media. Each colored bubble represents a different population of evaluators, as indicated in the legend on the right. The size of each bubble is proportional to the number of respondents from that population who rated the corresponding question for each text type.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v6i1e78843_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Proportional contributions of evaluation domains to each participant&#x2019;s total score, grouped by reviewer identity. A 100% stacked bar chart in which each vertical bar represents an individual participant&#x2019;s normalized total evaluation score (scaled to 100%), with participants organized along the x-axis and grouped by self-reported identity: paper author, communication professional, general population (18+ years), health manager, and health student or professional. Within each bar, colored segments depict the relative weight of each of the 4 evaluation categories, quality (light blue), language (teal), detailing (gold), and clarity (maroon), in that participant&#x2019;s overall total rating (sum of individual 1-5 domain scores). The y-axis indicates the percentage contribution of each category to the participant&#x2019;s total score.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="infodemiology_v6i1e78843_fig03.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Average (SD) evaluation scores by audience and stakeholder group for each adapted output. This table presents the central tendency and dispersion (mean, SD) of four evaluation domains: (1) clarity, (2) detailing, (3) language suitability, and (4) content quality, across four target&#x2010;audience contexts (&#x201C;for children,&#x201D; &#x201C;for health managers,&#x201D; &#x201C;for social media,&#x201D; and &#x201C;for the general public&#x201D;). Within each context, scores are shown separately for each evaluator subgroup (authors, general public, students or health professionals, health managers, and communication professionals). All ratings were provided on a 5&#x2010;point scale ranging from 1&#x2010;5.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Target audience and evaluator</td><td align="left" valign="bottom">Clarity</td><td align="left" valign="bottom">Detailing</td><td align="left" valign="bottom">Language suitability</td><td align="left" valign="bottom">Content quality</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">For the general public, mean (SD)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Authors</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">4.80 (0.45)</td><td align="left" valign="top">4.80 (0.45)</td><td align="left" valign="top">4.60 (0.55)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>General public</td><td align="left" valign="top">4.94 (0.25)</td><td align="left" valign="top">4.56 (0.89)</td><td align="left" valign="top">4.62 (0.62)</td><td align="left" valign="top">4.75 (0.45)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Students or health professionals</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">4.86 (0.36)</td><td align="left" valign="top">4.93 (0.27)</td><td align="left" valign="top">4.93 (0.27)</td></tr><tr><td align="left" valign="top" colspan="5">For children, mean (SD)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Authors</td><td align="left" valign="top">4.80 (0.42)</td><td align="left" valign="top">4.50 (0.71)</td><td align="left" valign="top">4.40 (0.84)</td><td align="left" valign="top">4.70 (0.48)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>General public</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">4.83 (0.41)</td><td align="left" valign="top">4.83 (0.41)</td><td align="left" valign="top">4.83 (0.41)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Students or health professionals</td><td align="left" valign="top">4.82 (0.40)</td><td align="left" valign="top">4.64 (0.67)</td><td align="left" valign="top">4.73 (0.65)</td><td align="left" valign="top">4.73 (0.47)</td></tr><tr><td align="left" valign="top" colspan="5">For health managers, mean (SD)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Authors</td><td align="left" valign="top">4.29 (0.76)</td><td align="left" valign="top">3.29 (0.49)</td><td align="left" valign="top">4.43 (0.53)</td><td align="left" valign="top">3.71 (0.49)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Students or health professionals</td><td align="left" valign="top">4.83 (0.48)</td><td align="left" valign="top">4.58 (0.72)</td><td align="left" valign="top">4.62 (0.71)</td><td align="left" valign="top">4.67 (0.56)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Health managers</td><td align="left" valign="top">4.00 (1.41)</td><td align="left" valign="top">4.00 (1.41)</td><td align="left" valign="top">4.00 (0.82)</td><td align="left" valign="top">4.25 (0.96)</td></tr><tr><td align="left" valign="top" colspan="5">For social media, mean (SD)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Authors</td><td align="left" valign="top">4.64 (0.50)</td><td align="left" valign="top">4.09 (0.83)</td><td align="left" valign="top">4.73 (0.65)</td><td align="left" valign="top">4.55 (0.52)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>General public</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">4.75 (0.50)</td><td align="left" valign="top">4.50 (1.00)</td><td align="left" valign="top">4.50 (1.00)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Students or health professionals</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">4.40 (0.89)</td><td align="left" valign="top">4.80 (0.45)</td><td align="left" valign="top">4.60 (0.55)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Communication professionals</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">5.00 (0.00)</td><td align="left" valign="top">5.00 (0.00)</td></tr></tbody></table></table-wrap><p>In addition to quantitative ratings, anonymous evaluators were invited to provide open-ended comments on the chatbot-generated materials. A total of 68 comments were collected, distributed across the evaluated target audiences: &#x201C;for children&#x201D; (n=14), &#x201C;for the general public&#x201D; (n=27), &#x201C;for health managers&#x201D; (n=11), and &#x201C;for social media&#x201D; (n=16; <xref ref-type="table" rid="table3">Table 3</xref>). Across all categories, the overall tone of the comments was positive and constructive. For children&#x2019;s materials, praise regarding language was the most frequent (8/14, 57.1%), while 42.9% (6/14) of comments did not address language. Information praise (4/14, 28.6%) and information criticism (4/14, 28.6%) were also observed. Only 7.1% (1/14) of comments suggested the material did not fully comply with its intended proposal. For health manager materials, comments were more evenly distributed: information criticism (4/11, 36.3%), language praise (4/11, 36.3%), and proposal compliance (9/11, 81.8%) were most common, though 18.2% (2/11) indicated noncompliance with the proposal. For social media materials, the highest frequency of feedback related to information criticism (6/16, 37.5%) and structure criticism (4/16, 25%), reflecting the platform-specific communication challenges. A majority (13/16, 81.3%) of comments judged the materials as compliant with the intended proposal. For general public materials, language praise was dominant (18/27, 66.7%), with a smaller proportion of comments addressing information (only 29.6% provided any information-related feedback). Most comments (23/27, 85.2%) indicated that the outputs complied with the intended proposal. Across all targets, the high proportion of proposal compliance comments indicates strong overall alignment between the outputs and their target audiences. A full compilation of the anonymous comments is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Distribution of types of comments by target audience. This table displays the frequency (n) and percentage (%). Comments were categorized into 4 domains: language, information, structure, and proposal. For each domain, comments were classified as criticism, praise, or not applicable (for language, information, and structure), or as complies with proposal or does not comply with proposal (for proposal). Comments could be assigned to multiple domains and categories.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">For children<break/>(n=14)</td><td align="left" valign="bottom">For health managers<break/>(n=11)</td><td align="left" valign="bottom">For social media<break/>(n=16)</td><td align="left" valign="bottom">For the general public<break/>(n=27)</td></tr></thead><tbody><tr><td align="left" valign="top">Language, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Criticism</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (9.1)</td><td align="left" valign="top">2 (12.5)</td><td align="left" valign="top">2 (7.4)</td></tr><tr><td align="left" valign="top">&#x2003;Praise</td><td align="left" valign="top">8 (57.1)</td><td align="left" valign="top">4 (36.3)</td><td align="left" valign="top">5 (31.2)</td><td align="left" valign="top">18 (66.7)</td></tr><tr><td align="left" valign="top">&#x2003;Not applicable</td><td align="left" valign="top">6 (42.9)</td><td align="left" valign="top">6 (54.6)</td><td align="left" valign="top">9 (56.3)</td><td align="left" valign="top">7 (25.9)</td></tr><tr><td align="left" valign="top">Information, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Criticism</td><td align="left" valign="top">4 (28.6)</td><td align="left" valign="top">4 (36.3)</td><td align="left" valign="top">6 (37.5)</td><td align="left" valign="top">5 (18.5)</td></tr><tr><td align="left" valign="top">&#x2003;Praise</td><td align="left" valign="top">4 (28.6)</td><td align="left" valign="top">2 (18.2)</td><td align="left" valign="top">1 (6.2)</td><td align="left" valign="top">3 (11.1)</td></tr><tr><td align="left" valign="top">&#x2003;Not applicable</td><td align="left" valign="top">6 (42.9)</td><td align="left" valign="top">5 (45.5)</td><td align="left" valign="top">9 (56.3)</td><td align="left" valign="top">19 (70.4)</td></tr><tr><td align="left" valign="top">Structure, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Criticism</td><td align="left" valign="top">3 (21.4)</td><td align="left" valign="top">2 (18.2)</td><td align="left" valign="top">4 (25)</td><td align="left" valign="top">2 (7.4)</td></tr><tr><td align="left" valign="top">&#x2003;Praise</td><td align="left" valign="top">3 (21.4)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Not applicable</td><td align="left" valign="top">8 (57.1)</td><td align="left" valign="top">9 (81.8)</td><td align="left" valign="top">11 (68.8)</td><td align="left" valign="top">25 (92.6)</td></tr><tr><td align="left" valign="top">Proposal, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Does not comply with the proposal</td><td align="left" valign="top">1 (7.1)</td><td align="left" valign="top">2 (18.2)</td><td align="left" valign="top">3 (18.7)</td><td align="left" valign="top">4 (14.8)</td></tr><tr><td align="left" valign="top">&#x2003;Complies with the proposal</td><td align="left" valign="top">13 (92.9)</td><td align="left" valign="top">9 (81.8)</td><td align="left" valign="top">13 (81.3)</td><td align="left" valign="top">23 (85.2)</td></tr></tbody></table></table-wrap></sec><sec id="s3-4"><title>Comparative Accuracy and Context Stability Evaluation</title><p>A detailed comparison between Maria Ci&#x00EA;ncia and the base GPT-4.5 model was conducted across 4 conversational criteria: establishment of context, continuity of conversation, resilience to interruption, and return to context, stratified by target audience (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For Maria Ci&#x00EA;ncia, mean scores were high across all target audiences and criteria. For the general public, Maria Ci&#x00EA;ncia achieved perfect continuity of conversation (5.00, SD 0.00) and high stability across all other dimensions (establishment of context: 4.75, SD 0.50; interruption of context: 4.75, SD 0.50; and return to context: 4.75, SD 0.50). In comparison, the base GPT-4.5 model exhibited lower mean scores across several criteria.</p><p>For children, Maria Ci&#x00EA;ncia again showed higher mean scores, with perfect scores for interruption of context (5.00, SD 0.00) and strong scores across other criteria (establishment of context: 4.66, SD 0.58; continuity: 4.66, SD 0.58; and return to context: 4.66, SD 0.58). The base GPT-4.5 model showed substantially lower performance in this category, particularly in continuity (3.00, SD 0.82) and establishment of context (3.25, SD 0.50), indicating challenges in maintaining audience-appropriate conversation flow for younger users.</p><p>For social media outputs, scores remained high, with means of 4.50 (SD 0.58) for establishment of context and continuity of conversation, and 5.00 (SD 0.00) for criterion resilience to interruption. In contrast, the base GPT-4.5 model exhibited greater variability, particularly in outputs for children and health managers. For children, mean scores were notably lower in the establishment of context (3.25, SD 0.96), continuity of conversation (3.00, SD 0.82), and resilience to interruption (3.00, SD 0.82), highlighting difficulties in maintaining and recovering conversational context. For health managers, while context establishment remained high (4.75, SD 0.50), performance dropped in criteria resilience to interruption (3.75, SD 0.96) and continuity of conversation (4.25, SD 0.50). Across all targets, the base GPT-4.5 model showed more frequent context drift and reduced continuity compared to Maria Ci&#x00EA;ncia (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-5"><title>Readability Evaluation</title><p>Readability metrics derived from the ALT framework revealed significant differences between texts generated by Maria Ci&#x00EA;ncia and those generated by the base GPT-4.5 model. For materials designed for children, the overall grade level was higher for Maria Ci&#x00EA;ncia outputs compared to base GPT-4.5 (MC: 8.23, SD 0.96 vs GPT: 7.56, SD 1.03; <italic>P</italic>=.002). While all texts from both generators were classified as having high legibility, differences emerged across several quantitative readability indices. Maria Ci&#x00EA;ncia texts showed lower Flesch reading ease scores (MC: 67.1, SD 5.51 vs GPT: 71.3, SD 5.80; <italic>P</italic>=.001) and higher Flesch-Kincaid grade levels (MC: 7.58, SD 0.98 vs GPT: 6.70, SD 0.98; <italic>P</italic>&#x003C;.001), indicating increased textual complexity. Similar patterns were observed for the adjusted Gunning fog index (<italic>P</italic>&#x003C;.001), the ARI (<italic>P</italic>=.004), the number of words per sentence (<italic>P</italic>&#x003C;.001), and several syllables per word (<italic>P</italic>=.002). No statistically significant differences were observed between generators for the Coleman-Liau index, letters per word, or proportion of complex words (<xref ref-type="table" rid="table4">Table 4</xref>).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Readability analysis of texts. This table presents the central tendency and dispersion (mean, SD) of readability metrics, as well as the frequency (n) and percentage (%) for categorical variables.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">GPT base</td><td align="left" valign="bottom">Maria Ci&#x00EA;ncia</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">For children</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Overall grade level, mean (SD)</td><td align="left" valign="top">7.56 (1.03)</td><td align="left" valign="top">8.23 (0.96)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recommended age group (year), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.08</td></tr><tr><td align="left" valign="top">&#x2003;11&#x2010;14</td><td align="left" valign="top">39 (83)</td><td align="left" valign="top">30 (63.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;15&#x2010;18</td><td align="left" valign="top">8 (17)</td><td align="left" valign="top">16 (36.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Legibility result, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;High</td><td align="left" valign="top">47 (100)</td><td align="left" valign="top">47 (100)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch reading ease, mean (SD)</td><td align="left" valign="top">71.3 (5.80)</td><td align="left" valign="top">67.1 (5.51)</td><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gulpease index, mean (SD)</td><td align="left" valign="top">69.6 (4.26)</td><td align="left" valign="top">1104 (6883)</td><td align="left" valign="top">.32</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch-Kincaid grade level, mean (SD)</td><td align="left" valign="top">6.70 (0.98)</td><td align="left" valign="top">7.58 (0.98)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Adjusted Gunning fog index, mean (SD)</td><td align="left" valign="top">8.12 (0.85)</td><td align="left" valign="top">8.85 (0.79)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Automated readability index, mean (SD)</td><td align="left" valign="top">6.34 (1.24)</td><td align="left" valign="top">7.09 (1.18)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Coleman-Liau index, mean (SD)</td><td align="left" valign="top">9.23 (1.21)</td><td align="left" valign="top">9.64 (1.05)</td><td align="left" valign="top">.09</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Letters per word, mean (SD)</td><td align="left" valign="top">4.65 (0.21)</td><td align="left" valign="top">4.68 (0.20)</td><td align="left" valign="top">.51</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Syllables per word, mean (SD)</td><td align="left" valign="top">1.98 (0.08)</td><td align="left" valign="top">2.03 (0.07)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Words per sentence, mean (SD)</td><td align="left" valign="top">11.2 (1.44)</td><td align="left" valign="top">12.5 (1.45)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Complex words (%), mean (SD)</td><td align="left" valign="top">13.7 (3.44)</td><td align="left" valign="top">14.6 (2.44)</td><td align="left" valign="top">.15</td></tr><tr><td align="left" valign="top">For the health manager</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Overall grade level, mean (SD)</td><td align="left" valign="top">13.7 (1.70)</td><td align="left" valign="top">14.4 (2.05)</td><td align="left" valign="top">.11</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recommended age group (year), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top">&#x2003;15&#x2010;18</td><td align="left" valign="top">10 (21.3)</td><td align="left" valign="top">5 (10.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Can be easily understood by university students</td><td align="left" valign="top">30 (63.8)</td><td align="left" valign="top">35 (74.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;For people with a college degree</td><td align="left" valign="top">7 (14.9)</td><td align="left" valign="top">3 (6.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Extremely difficult text</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">4 (8.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Legibility result, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.32</td></tr><tr><td align="left" valign="top">&#x2003;High</td><td align="left" valign="top">10 (21.3)</td><td align="left" valign="top">5 (10.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Medium</td><td align="left" valign="top">34 (72.3)</td><td align="left" valign="top">37 (78.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Low</td><td align="left" valign="top">3 (6.4)</td><td align="left" valign="top">5 (10.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch reading ease, mean (SD)</td><td align="left" valign="top">27.8 (8.13)</td><td align="left" valign="top">32.6 (8.61)</td><td align="left" valign="top">.008</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gulpease index, mean (SD)</td><td align="left" valign="top">53.7 (6.72)</td><td align="left" valign="top">50.0 (4.36)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch-Kincaid grade level, mean (SD)</td><td align="left" valign="top">13.5 (1.81)</td><td align="left" valign="top">14.0 (2.22)</td><td align="left" valign="top">.24</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Adjusted Gunning fog index, mean (SD)</td><td align="left" valign="top">11.5 (2.20)</td><td align="left" valign="top">14.0 (2.81)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Automated readability index, mean (SD)</td><td align="left" valign="top">13.3 (2.06)</td><td align="left" valign="top">14.2 (2.64)</td><td align="left" valign="top">.08</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Coleman-Liau index, mean (SD)</td><td align="left" valign="top">16.4 (1.21)</td><td align="left" valign="top">15.0 (1.11)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Letters per word, mean (SD)</td><td align="left" valign="top">5.95 (0.21)</td><td align="left" valign="top">5.59 (0.22)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Syllables per word, mean (SD)</td><td align="left" valign="top">2.56 (0.10)</td><td align="left" valign="top">2.42 (0.11)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Words per sentence, mean (SD)</td><td align="left" valign="top">13.5 (4.17)</td><td align="left" valign="top">19.2 (6.09)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Complex words (%), mean (SD)</td><td align="left" valign="top">25.9 (3.44)</td><td align="left" valign="top">23.9 (3.08)</td><td align="left" valign="top">.006</td></tr><tr><td align="left" valign="top">For social media</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Overall grade level, mean (SD)</td><td align="left" valign="top">8.89 (2.05)</td><td align="left" valign="top">11.2 (1.59)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recommended age group (years), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;11&#x2010;14</td><td align="left" valign="top">20 (42.6)</td><td align="left" valign="top">1 (2.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;15&#x2010;18</td><td align="left" valign="top">24 (51)</td><td align="left" valign="top">40 (85.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Can be easily understood by university students</td><td align="left" valign="top">3 (6.4)</td><td align="left" valign="top">6 (12.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Legibility result, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.22</td></tr><tr><td align="left" valign="top">&#x2003;High</td><td align="left" valign="top">43 (91.5)</td><td align="left" valign="top">39 (83)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Medium</td><td align="left" valign="top">4 (8.5)</td><td align="left" valign="top">8 (17)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch reading ease, mean (SD)</td><td align="left" valign="top">65.5 (12.8)</td><td align="left" valign="top">50.7 (8.95)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gulpease index, mean (SD)</td><td align="left" valign="top">64.4 (6.92)</td><td align="left" valign="top">57.1 (4.27)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch-Kincaid grade level, mean (SD)</td><td align="left" valign="top">8.02 (2.26)</td><td align="left" valign="top">10.7 (1.75)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Adjusted Gunning fog index, mean (SD)</td><td align="left" valign="top">9.49 (1.72)</td><td align="left" valign="top">10.9 (1.95)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Automated readability index, mean (SD)</td><td align="left" valign="top">7.91 (2.52)</td><td align="left" valign="top">10.7 (1.97)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Coleman-Liau index, mean (SD)</td><td align="left" valign="top">10.1 (2.20)</td><td align="left" valign="top">12.4 (1.50)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Letters per word, mean (SD)</td><td align="left" valign="top">4.76 (0.38)</td><td align="left" valign="top">5.14 (0.29)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Syllables per word, mean (SD)</td><td align="left" valign="top">2.03 (0.16)</td><td align="left" valign="top">2.20 (0.12)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Words per sentence, mean (SD)</td><td align="left" valign="top">13.5 (2.97)</td><td align="left" valign="top">16.0 (4.10)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Complex words (%), mean (SD)</td><td align="left" valign="top">15 (4.83)</td><td align="left" valign="top">16.2 (3.12)</td><td align="left" valign="top">.17</td></tr><tr><td align="left" valign="top">For the general public</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Overall grade level, mean (SD)</td><td align="left" valign="top">10.5 (1.22)</td><td align="left" valign="top">9.96 (1.00)</td><td align="left" valign="top">.026</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recommended age group (year), n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.52</td></tr><tr><td align="left" valign="top">&#x2003;11&#x2010;14</td><td align="left" valign="top">3 (6.4)</td><td align="left" valign="top">2 (4.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;15&#x2010;18</td><td align="left" valign="top">41 (87.2)</td><td align="left" valign="top">44 (93.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Can be easily understood by university students</td><td align="left" valign="top">3 (6.4)</td><td align="left" valign="top">1 (2.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Legibility result, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.31</td></tr><tr><td align="left" valign="top">&#x2003;High</td><td align="left" valign="top">44 (93.6)</td><td align="left" valign="top">46 (97.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Medium</td><td align="left" valign="top">3 (6.4)</td><td align="left" valign="top">1 (2.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch reading ease, mean (SD)</td><td align="left" valign="top">53.1 (7.35)</td><td align="left" valign="top">58.7 (5.87)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gulpease index, mean (SD)</td><td align="left" valign="top">59.5 (4.05)</td><td align="left" valign="top">60.5 (3.08)</td><td align="left" valign="top">.21</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Flesch-Kincaid grade level, mean (SD)</td><td align="left" valign="top">9.92 (1.24)</td><td align="left" valign="top">9.33 (1.05)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Adjusted Gunning fog index, mean (SD)</td><td align="left" valign="top">9.96 (1.23)</td><td align="left" valign="top">10.4 (1.11)</td><td align="left" valign="top">.07</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Automated readability index, mean (SD)</td><td align="left" valign="top">9.83 (1.47)</td><td align="left" valign="top">9.02 (1.21)</td><td align="left" valign="top">.06</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Coleman-Liau index, mean (SD)</td><td align="left" valign="top">12.2 (1.39)</td><td align="left" valign="top">10.9 (1.00)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Letters per word, mean (SD)</td><td align="left" valign="top">5.14 (0.25)</td><td align="left" valign="top">4.86 (0.18)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Syllables per word, mean (SD)</td><td align="left" valign="top">2.20 (0.11)</td><td align="left" valign="top">2.10 (0.08)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Words per sentence, mean (SD)</td><td align="left" valign="top">14.0 (2.38)</td><td align="left" valign="top">15.1 (1.83)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Complex words (%), mean (SD)</td><td align="left" valign="top">16.2 (4.51)</td><td align="left" valign="top">15.8 (3.06)</td><td align="left" valign="top">.62</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>Not available.</p></fn></table-wrap-foot></table-wrap><p>The readability analyses of texts generated for health managers revealed overall comparable patterns between Maria Ci&#x00EA;ncia and the base GPT-4.5 model, with few statistically significant differences across metrics. The overall grade level did not differ significantly between generators (<italic>P</italic>=.11), as well as the classification by recommended audience level (<italic>P</italic>=.13), and the overall legibility categories (<italic>P</italic>=.32). Despite these similarities, Maria Ci&#x00EA;ncia texts exhibited higher Flesch reading ease scores compared to base GPT-4.5 (MC: 32.6, SD 8.61 vs GPT: 27.8, SD 8.13; <italic>P</italic>=.008), higher Gunning fog index (MC: 14.0, SD 2.81 vs GPT: 11.5, SD 2.20; <italic>P</italic>&#x003C;.001), alongside lower Gulpease index values (MC: 50.0, SD 4.36 vs GPT: 53.7, SD 6.72; <italic>P</italic>=.003), if compared to base GPT 4.5 model (<xref ref-type="table" rid="table4">Table 4</xref>). At the lexical and syntactic levels, Maria Ci&#x00EA;ncia texts contained fewer letters per word (<italic>P</italic>&#x003C;.001) and fewer syllables per word (<italic>P</italic>&#x003C;.001), but substantially longer sentences (<italic>P</italic>&#x003C;.001). The proportion of complex words was slightly lower in Maria Ci&#x00EA;ncia outputs (23.9%, SD 3.08% vs 25.9%, SD 3.44%; <italic>P</italic>=.006; <xref ref-type="table" rid="table4">Table 4</xref>).</p><p>For materials intended for social media, Maria Ci&#x00EA;ncia outputs exhibited a substantially higher overall grade level compared to base GPT-4.5 (MC: 11.2, SD 1.59 vs GPT: 8.89, SD 2.05; <italic>P</italic>&#x003C;.001). Consistent with this pattern, having high legibility across multiple recommended age group classifications differed significantly between generators (<italic>P</italic>&#x003C;.001). While base GPT-4.5 outputs were more frequently classified as suitable for younger adolescents (11&#x2010;14 y), the majority of Maria Ci&#x00EA;ncia&#x2019;s texts were classified as appropriate for older adolescents (15&#x2010;18 y). Despite these differences in textual complexity, overall legibility categories (high vs medium) were comparable between generators (<italic>P</italic>=.22), with most texts in both groups classified as having high legibility. Across multiple readability indices, Maria Ci&#x00EA;ncia&#x2019;s texts consistently demonstrated increased linguistic complexity. These outputs showed lower Flesch reading ease scores (MC: 50.7, SD 8.95 vs GPT: 65.5, SD 12.8; <italic>P</italic>&#x003C;.001) and lower Gulpease index values (MC: 57.1, SD 4.27 vs GPT: 64.4, SD 6.92; <italic>P</italic>&#x003C;.001), alongside higher Flesch-Kincaid grade levels (MC: 10.7 (SD 1.75 vs GPT: 8.02, SD 2.26; <italic>P</italic>&#x003C;.001). Similar trends were observed for the adjusted Gunning fog index, ARI, and Coleman-Liau index (<italic>P</italic>&#x003C;.001). At the lexical and syntactic levels, Maria Ci&#x00EA;ncia outputs contained longer words, reflected by higher letters-per-word and syllables-per-word ratios (both <italic>P</italic>&#x003C;.001), as well as longer sentences (<italic>P</italic>=.002). The proportion of complex words did not differ significantly between generators (<xref ref-type="table" rid="table4">Table 4</xref>).</p><p>Readability analyses indicated modest but statistically significant differences between texts generated by Maria Ci&#x00EA;ncia and those generated by the base GPT-4.5 model for materials aimed at the general population. Maria Ci&#x00EA;ncia outputs exhibited a slightly lower overall grade level compared to base GPT-4.5 (MC: 9.96, SD 1.00 vs GPT: 10.5, SD 1.22; <italic>P</italic>=.03). Recommended age group classifications were similar between generators (<italic>P</italic>=.52), with the majority of texts in both groups classified as suitable for adolescents aged 15&#x2010;18 years. Overall legibility categories (high vs medium) were also comparable (<italic>P</italic>=.31), with most texts classified as having high legibility. Several readability indices suggested improved linguistic accessibility in Maria Ci&#x00EA;ncia outputs. These texts showed higher Flesch Reading Ease scores (MC: 58.7, SD 5.87 vs GPT: 53.1, SD 7.35; <italic>P</italic>&#x003C;.001) and lower Flesch&#x2013;Kincaid Grade Levels (MC: 9.33, SD 1.05 vs GPT: 9.92, SD 1.24; <italic>P</italic>=.02). The Coleman-Liau Index was also lower for Maria Ci&#x00EA;ncia texts (MC: 10.9, SD 1.00 vs GPT: 12.2, SD 1.39; <italic>P</italic>&#x003C;.001), indicating reduced lexical complexity. At the word level, Maria Ci&#x00EA;ncia outputs contained fewer letters per word (MC: 4.86, SD 0.18 vs GPT: 5.14, SD 0.25; <italic>P</italic>&#x003C;.001) and fewer syllables per word (MC: 2.10, SD 0.08 vs GPT: 2.20, SD 0.11; <italic>P</italic>&#x003C;.001). In contrast, Maria Ci&#x00EA;ncia texts exhibited a slightly higher number of words per sentence compared to base GPT-4.5 outputs (MC: 15.1, SD 1.83 vs 14.0, SD GPT: 2.38; <italic>P</italic>=.02). No statistically significant differences were observed between generators in the proportion of complex words (<xref ref-type="table" rid="table4">Table 4</xref>).</p><p>When directly compared with human-written texts, both base GPT-4.5 and Maria Ci&#x00EA;ncia showed systematic and statistically significant differences across nearly all readability metrics. Human texts consistently exhibited higher overall grade levels (15.6, SD 1.96) than base GPT-4.5 (11.0, SD 1.15) and Maria Ci&#x00EA;ncia (9.7, SD 0.67), indicating substantially greater linguistic complexity. This pattern was reinforced by multiple indices: human abstracts had lower Flesch reading ease scores and higher Flesch-Kincaid, Gunning fog, ARI, and Coleman-Liau indices, alongside longer sentences and a higher proportion of complex words (all with <italic>P</italic>&#x003C;.01, <xref ref-type="table" rid="table5">Table 5</xref>). In contrast, both Maria Ci&#x00EA;ncia and base GPT-4.5 generated texts that were easier to read, shorter at the sentence level, and lexically simpler. Importantly, while both systems differed from human writing in the same direction, Maria Ci&#x00EA;ncia outputs tended to be consistently simpler than base GPT-4.5 across most metrics, including reading ease, grade level, sentence length, and lexical density (<xref ref-type="table" rid="table5">Table 5</xref>).</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Differences between Maria Ci&#x00EA;ncia, base GPT 4.5, and human-written texts. This table presents the central tendency and dispersion (mean, SD) of readability metrics, as well as the frequency (n) and percentage (%) for categorical variables.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">GPT base&#x00B0;</td><td align="left" valign="bottom">Maria Ci&#x00EA;ncia</td><td align="left" valign="bottom">Human</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Overall grade level, mean (SD)</td><td align="left" valign="top">11.0 (1.15)</td><td align="left" valign="top">9.70 (0.67)</td><td align="left" valign="top">15.6 (1.96)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Recommended age group, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>11&#x2010;14 year</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (10)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>15&#x2010;18 year</td><td align="left" valign="top">9 (90)</td><td align="left" valign="top">9 (90)</td><td align="left" valign="top">1 (10)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Can be easily understood by university students</td><td align="left" valign="top">1 (10)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">3 (30)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>For people with a college degree</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">6 (60)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Legibility result, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>High</td><td align="left" valign="top">9 (90)</td><td align="left" valign="top">10 (100)</td><td align="left" valign="top">1 (10)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medium</td><td align="left" valign="top">1 (10)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">5 (50)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Low</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">4 (40)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Flesch reading ease, mean (SD)</td><td align="left" valign="top">50.6 (6.93)</td><td align="left" valign="top">58.7 (5.81)</td><td align="left" valign="top">32.4 (10.5)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Gulpease index, mean (SD)</td><td align="left" valign="top">57.8 (3.52)</td><td align="left" valign="top">60.9 (2.84)</td><td align="left" valign="top">47.1 (3.53)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Flesch-Kincaid grade level, mean (SD)</td><td align="left" valign="top">10.6 (1.10)</td><td align="left" valign="top">9.10 (0.77)</td><td align="left" valign="top">15.4 (1.92)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Adjusted Gunning fog index, mean (SD)</td><td align="left" valign="top">11.1 (1.43)</td><td align="left" valign="top">10.1 (0.88)</td><td align="left" valign="top">16.6 (2.06)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Automated readability index, mean (SD)</td><td align="left" valign="top">10.4 (1.32)</td><td align="left" valign="top">8.91 (0.95)</td><td align="left" valign="top">16.1 (2.10)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Coleman-Liau index, mean (SD)</td><td align="left" valign="top">12.3 (1.48)</td><td align="left" valign="top">10.9 (0.86)</td><td align="left" valign="top">14.2 (1.58)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Letters per word, mean (SD)</td><td align="left" valign="top">5.14 (0.28)</td><td align="left" valign="top">4.90 (0.17)</td><td align="left" valign="top">5.35 (0.28)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top">Syllables per word, mean (SD)</td><td align="left" valign="top">2.20 (0.11)</td><td align="left" valign="top">2.08 (0.08)</td><td align="left" valign="top">2.32 (0.11)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Words per sentence, mean (SD)</td><td align="left" valign="top">15.5 (3.18)</td><td align="left" valign="top">14.6 (1.64)</td><td align="left" valign="top">26.0 (3.29)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Complex words (%), mean (SD)</td><td align="left" valign="top">18.6 (3.94)</td><td align="left" valign="top">15.6 (2.67)</td><td align="left" valign="top">20.6 (4.40)</td><td align="left" valign="top">.02</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>This study provides exploratory evidence that Maria Ci&#x00EA;ncia is capable of producing audience-adapted science communication materials that are perceived as clear, accessible, and linguistically appropriate across a range of stakeholders. Materials tailored for children and the general public were especially well received, while outputs for health managers showed greater variability, reflecting the distinct informational demands of this audience. The more critical feedback from original paper authors highlights the inherent challenge of balancing scientific precision with public accessibility.</p><p>Qualitative feedback from anonymous evaluators reinforced these trends, highlighting the clarity and perceived usefulness of the materials and offering constructive suggestions to further adapt tone and terminology for specific audiences. These results are encouraging, particularly in light of the urgent need to address health misinformation, which continues to erode public trust in science, hinder the implementation of health policies, and contribute to adverse health outcomes [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. The COVID-19 pandemic brought the urgency of this issue into sharp focus, with widespread infodemics interfering with disease prevention efforts and amplifying avoidable harm [<xref ref-type="bibr" rid="ref2">2</xref>], emphasizing the importance of tools that support effective science communication.</p><p>By enabling the production of trusted, audience-specific materials, Maria Ci&#x00EA;ncia can complement existing strategies for combating misinformation, which traditionally rely on reactive fact-checking or broad public health campaigns [<xref ref-type="bibr" rid="ref16">16</xref>]. Within the scope of this evaluation, Maria Ci&#x00EA;ncia demonstrated superior conversational stability and contextual accuracy, particularly for sensitive audiences such as children, critical for fostering health literacy from an early age. Furthermore, previous studies have shown that GPT-based assistants specifically trained or configured with domain-relevant and ethically curated materials achieve higher performance and contribute to greater user trust and acceptance of the platform in public health and educational contexts [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. The approach adopted by Maria Ci&#x00EA;ncia, combining prompt engineering with thematic supervision, is consistent with these findings and reinforces the value of domain-specific configuration for science communication tools.</p><p>Beyond model performance, Maria Ci&#x00EA;ncia was designed to reduce practical barriers that limit researchers&#x2019; engagement with public audiences. Despite growing recognition of science communication as a core responsibility, academic structures still prioritize publication in peer-reviewed journals over community outreach [<xref ref-type="bibr" rid="ref3">3</xref>]. Researchers often lack time, institutional support, or training to translate their findings into accessible formats. The data presented here suggest that even minimal support from tools such as Maria Ci&#x00EA;ncia can enable more scientists to participate meaningfully in public engagement by providing formats aligned with the needs of different audiences and reducing technical barriers to communication.</p><p>Complementing subjective evaluations, the readability analyses provide an objective lens through which to interpret these findings. Texts generated by Maria Ci&#x00EA;ncia exhibited a deliberate balance between linguistic complexity and overall legibility. In some audience categories, modest increases in grade level, sentence length, or syllabic density were observed; however, these changes did not consistently translate into lower legibility classifications. Instead, they reflect structural adjustments aimed at preserving informational completeness rather than a loss of accessibility. Readability indices such as the Flesch reading ease, Flesch-Kincaid grade level, Gunning fog index, ARI, Coleman-Liau index, and Gulpease index are widely used in health communication research as proxies for accessibility and audience appropriateness [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Their combined use is particularly valuable for comparative analyses, as it allows systematic assessment of how different communication strategies modulate linguistic complexity while maintaining interpretability. Importantly, readability metrics are not end points: they function as proxies that can be linked to downstream outcomes such as comprehension, perceived credibility, and cognitive load, especially in settings where audiences must navigate competing narratives and misinformation. Lower linguistic complexity and shorter syntactic structures have been associated with improved comprehension and reduced cognitive load, particularly among audiences with limited health literacy, and may support trust-building when messages must compete with misleading narratives in digital environments [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Although readability alone cannot guarantee understanding or prevent misinformation, it provides an objective benchmark for whether outputs are likely to be approachable for nonspecialist readers and therefore serves as a useful complement to subjective quality ratings.</p><p>Direct comparisons with human-written science communication materials further contextualize these results. Human-authored texts consistently demonstrated substantially higher linguistic complexity across nearly all indices, including grade level, sentence length, and lexical density, reinforcing longstanding evidence that expert-driven communication frequently exceeds recommended readability thresholds for lay audiences. In contrast, both Maria Ci&#x00EA;ncia and the base GPT-4.5 model produced texts that were systematically easier to read and more linguistically accessible. While both systems diverged from human writing in the same direction, Maria Ci&#x00EA;ncia&#x2019;s outputs were consistently simpler than those generated by the base model across most metrics. Together, these findings suggest that Maria Ci&#x00EA;ncia does not indiscriminately simplify content but rather modulates textual structure in an audience-dependent manner, supporting improved accessibility without compromising overall legibility.</p><p>Differences observed for health managers are also conceptually expected. Communication for managerial or policy-facing audiences typically prioritizes actionability, decision relevance, and structured synthesis rather than simplified language alone. As a result, evaluation criteria that work well for general audiences may undercapture what makes output useful for managers or policymakers, and future evaluations should incorporate audience-specific criteria tailored to decision-making contexts.</p><p>From an implementation perspective, these characteristics position Maria Ci&#x00EA;ncia as a practical support tool for knowledge translation workflows. Potential applications include integration into journal dissemination processes, public health communication teams, and institutional outreach initiatives, where rapid generation of audience-specific summaries can support timely and responsible dissemination of peer-reviewed evidence. Importantly, such integration should remain coupled with human oversight to ensure scientific fidelity and contextual appropriateness. For example, a journal or research group could (1) identify a newly accepted open-access paper, (2) generate a public-facing summary and a social media post using Maria Ci&#x00EA;ncia, (3) generate a brief manager-facing version highlighting actionable implications, (4) conduct a rapid author or communications-team review for scientific fidelity and tone, and (5) disseminate the finalized outputs through institutional websites, press offices, and social channels. Of note, although not evaluated in this paper, Maria Ci&#x00EA;ncia is also capable of generating images that can help in the dissemination of knowledge. This hypothetical pipeline illustrates how AI-assisted generation can reduce production time while preserving accountability through human review.</p><p>Recent advances in AI also point to future directions for audience-centered health communication tools that extend beyond the scope of this study. Federated learning frameworks, for example, have been increasingly explored in health care to enable collaborative model improvement across institutions while preserving data privacy and regulatory compliance [<xref ref-type="bibr" rid="ref4">4</xref>]. In the context of health communication, such approaches may become relevant for incorporating region- or institution-specific linguistic and cultural patterns without requiring direct sharing of sensitive data. Similarly, developments in self-supervised learning highlight the potential of leveraging large volumes of unlabeled data to improve contextual understanding and adaptability of language models. In health care and related domains, self-supervised approaches have been proposed to enhance prediction and pattern recognition while reducing dependence on costly manual annotation [<xref ref-type="bibr" rid="ref21">21</xref>]. Although not applied in the present work, these principles suggest possible future pathways for improving the adaptability and robustness of AI-assisted communication systems, particularly in settings where labeled training data are scarce or ethically constrained. Together, these developments emphasize that future research should explore how privacy-preserving and data-efficient learning paradigms can complement human oversight in responsible AI-driven health communication.</p><p>As AI-driven science communication tools gain increasing relevance worldwide, it is important to consider their potential for application across diverse international contexts. Although initially developed and evaluated in Brazilian Portuguese, the architecture and prompting framework of Maria Ci&#x00EA;ncia, being built on the GPT platform, allow the tool to operate in over 50 languages with the same ethical and technical standards [<xref ref-type="bibr" rid="ref14">14</xref>]. This provides immediate potential for multilingual deployment in global health communication efforts. However, while the tool can linguistically adapt to multiple languages, effective application across different regions also requires attention to cultural nuances, health literacy variations, and sociolinguistic differences. Linguistic translation alone is insufficient; local framing, terminology, and narrative styles must be carefully adapted to ensure meaningful engagement and to support health literacy and misinformation prevention across diverse public health ecosystems. Accordingly, future work should test culturally grounded adaptation workflows, ideally combining local expert review with community feedback.</p><p>Despite these strengths, this study has limitations. The number of evaluators per target audience was not standardized, and some subgroups, such as health managers and communication professionals, were underrepresented. Author evaluations, while informative, were based on subjective perceptions and not validated against formal scientific fidelity criteria. The evaluation also focused on perception and usability rather than long-term impacts on knowledge retention or behavioral outcomes. Third, children were not included as evaluators. As a result, evaluations of children-focused materials reflect adult perceptions and should be interpreted as preliminary. Furthermore, the tool was primarily tested in Brazilian Portuguese; while the underlying architecture is multilingual, additional research is needed to validate its performance in other languages and cultural contexts.</p><p>Even with these limitations, the evaluation provides a strong foundation to support the validity and utility of the tool. The systematic and transparent development process, combined with broad stakeholder engagement, underscores the potential of Maria Ci&#x00EA;ncia to contribute meaningfully to health literacy and misinformation prevention. Its ability to outperform a baseline GPT model in contextual stability and accuracy further validates the importance of domain-specific configuration for public health applications. Future evaluations will adopt a stratified design in which materials are assessed exclusively by their intended target audiences, using validated instruments and balanced stakeholder representation.</p><p>In summary, Maria Ci&#x00EA;ncia offers a promising avenue for enhancing knowledge translation and addressing the communication challenges posed by health misinformation. As international organizations and national governments have emphasized, combating the impacts of infodemics requires more than reactive correction. It necessitates proactive investment in tools and strategies that produce accessible, trusted, and culturally relevant information. By supporting the generation of audience-adapted materials and facilitating researcher engagement in public dialogue, Maria Ci&#x00EA;ncia contributes to this broader effort to advance scientific literacy and strengthen public health resilience.</p></sec></body><back><ack><p>We gratefully acknowledge Ms Luisa Vinagre and Mr Rodrigo Pontes for their valuable contributions in generating the chatbot outputs used in this study. We also extend our sincere thanks to all anonymous respondents who participated in the evaluation forms, and to Ms Elze Leite for her administrative support throughout the project.</p></ack><notes><sec><title>Funding</title><p>This study was supported by the Intramural Research Program of the Fundac&#x0327;a&#x0303;o Oswaldo Cruz (BBA). BS-P received a fellowship from the Funda&#x00E7;&#x00E3;o de Amparo &#x00E0; Pesquisa da Bahia (FAPESB), KV-S, JNC-O, GP-R, SDM, RRdCS, and MA-P, received fellowships from the Conselho Nacional de Desenvolvimento Cient&#x00ED;fico e Tecnol&#x00F3;gico (CNPq), Brazil. BdBA is a s&#x00EA;nior fellow from the CNPq.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: MA-P, KV-S, BdBA</p><p>Data verification and curation: BS-P, KV-S</p><p>Formal analysis: MA-P, BS-P, GP-R, JNC-O, KV-S</p><p>Funding acquisition: GP-R, BdBA</p><p>Investigation: MA-P, BS-P, KV-S, SDM, JNC-O, RRdCS, BdBA</p><p>Methodology: MA-P, KV-S, SDM, JNC-O, GP-R</p><p>Project administration: MA-P</p><p>Resources: MA-P, BdBA</p><p>Software: MA-P, BS-P, GP-R, JNC-O, KV-S</p><p>Supervision: MA-P, BdBA</p><p>Writing &#x2013; original draft: MA-P, KV-S, GP-R, BS-P</p><p>Writing &#x2013; review and editing: all authors</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">ALT</term><def><p>analysis of language and text</p></def></def-item><def-item><term id="abb3">ARI</term><def><p>automated readability index</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oliveira</surname><given-names>T de</given-names> </name></person-group><article-title>Como enfrentar a desinforma&#x00E7;&#x00E3;o cient&#x00ED;fica? Desafios sociais, pol&#x00ED;ticos e jur&#x00ED;dicos intensificados no contexto da pandemia [Article in Portuguese]</article-title><source>Liinc Rev</source><year>2020</year><month>12</month><day>23</day><volume>16</volume><issue>2</issue><fpage>e5374</fpage><pub-id pub-id-type="doi">10.18617/liinc.v16i2.5374</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Caceres</surname><given-names>MMF</given-names> </name><name name-style="western"><surname>Sosa</surname><given-names>JP</given-names> </name><name name-style="western"><surname>Lawrence</surname><given-names>JA</given-names> </name><etal/></person-group><article-title>The impact of misinformation on the COVID-19 pandemic</article-title><source>AIMS Public Health</source><year>2022</year><volume>9</volume><issue>2</issue><fpage>262</fpage><lpage>277</lpage><pub-id pub-id-type="doi">10.3934/publichealth.2022018</pub-id><pub-id pub-id-type="medline">35634019</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ara&#x00FA;jo-Pereira</surname><given-names>M</given-names> </name><name name-style="western"><surname>Andrade</surname><given-names>BB</given-names> </name></person-group><article-title>The heroic journey of young Brazilian scientists: challenges and opportunities</article-title><source>Lancet Reg Health Am</source><year>2024</year><month>05</month><volume>33</volume><fpage>100735</fpage><pub-id pub-id-type="doi">10.1016/j.lana.2024.100735</pub-id><pub-id pub-id-type="medline">38590323</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abbas</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Abbas</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Zahir</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SW</given-names> </name></person-group><article-title>Federated learning in smart healthcare: a comprehensive review on privacy, security, and predictive analytics with IoT integration</article-title><source>Healthcare (Basel)</source><year>2024</year><month>12</month><day>22</day><volume>12</volume><issue>24</issue><fpage>2587</fpage><pub-id pub-id-type="doi">10.3390/healthcare12242587</pub-id><pub-id pub-id-type="medline">39766014</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hakim</surname><given-names>VGA</given-names> </name><name name-style="western"><surname>Paiman</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Rahman</surname><given-names>MHS</given-names> </name></person-group><article-title>Genie&#x2010;on&#x2010;demand: a custom AI chatbot for enhancing learning performance, self&#x2010;efficacy, and technology acceptance in occupational health and safety for engineering education</article-title><source>Comp Appl Eng</source><year>2024</year><month>11</month><volume>32</volume><issue>6</issue><fpage>e22800</fpage><pub-id pub-id-type="doi">10.1002/cae.22800</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Accuracy, satisfaction, and impact of custom GPT in acquiring clinical knowledge: potential for AI-assisted medical education</article-title><source>Med Teach</source><year>2025</year><month>09</month><volume>47</volume><issue>9</issue><fpage>1502</fpage><lpage>1508</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2025.2458808</pub-id><pub-id pub-id-type="medline">39893644</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="thesis"><person-group person-group-type="author"><name name-style="western"><surname>Cunda</surname><given-names>BV</given-names> </name></person-group><article-title>Na ponta das l&#x00ED;nguas: pequeno gloss&#x00E1;rio para apoiar o enfrentamento do estigma e da discrimina&#x00E7;&#x00E3;o [Bachelor&#x2019;s thesis] [Article in Portuguese]</article-title><year>2023</year><access-date>2026-02-17</access-date><publisher-name>Universidade Federal do Rio Grande do Sul</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://lume.ufrgs.br/handle/10183/267984">https://lume.ufrgs.br/handle/10183/267984</ext-link></comment><pub-id pub-id-type="medline">38071171</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="web"><article-title>UNAIDS terminology guidelines</article-title><source>UNAIDS</source><year>2024</year><access-date>2026-02-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.unaids.org/en/resources/documents/2024/terminology_guidelines">https://www.unaids.org/en/resources/documents/2024/terminology_guidelines</ext-link></comment></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><article-title>Terminology guidelines</article-title><source>UNICEF</source><year>2016</year><access-date>2026-02-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.unicef.org/documents/terminology-guidelines">https://www.unicef.org/documents/terminology-guidelines</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="web"><article-title>Frontiers for young minds</article-title><source>Frontiers</source><access-date>2026-02-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://kids.frontiersin.org/">https://kids.frontiersin.org/</ext-link></comment></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Antonof</surname><given-names>G</given-names> </name><name name-style="western"><surname>Rodrigues</surname><given-names>M</given-names> </name><name name-style="western"><surname>Schmidt</surname><given-names>M</given-names> </name></person-group><article-title>Di&#x00E1;logos: um guia para divulga&#x00E7;&#x00E3;o cient&#x00ED;fica em linguagem simples [Article in Portuguese]</article-title><year>2023</year><access-date>2026-02-17</access-date><publisher-name>Universidade de Brasilia</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://bdm.unb.br/bitstream/10483/38689/2/2023_GabrielAntonoff_MateusRodrigues_MateusSilva_produto.pdf">https://bdm.unb.br/bitstream/10483/38689/2/2023_GabrielAntonoff_MateusRodrigues_MateusSilva_produto.pdf</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Paraguassu</surname><given-names>LB</given-names> </name><name name-style="western"><surname>da Costa</surname><given-names>CV</given-names> </name></person-group><article-title>ICICT simple language guide [Article in Portuguese]</article-title><year>2023</year><access-date>2026-02-17</access-date><publisher-name>Oswaldo Cruz Foundation. Institute of Scientific and Technological Communication and Information in Health</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.arca.fiocruz.br/handle/icict/61432">https://www.arca.fiocruz.br/handle/icict/61432</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="web"><source>Profiss&#x00E3;o Biotec</source><access-date>2026-02-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://profissaobiotec.com.br/">https://profissaobiotec.com.br/</ext-link></comment></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="web"><article-title>How to change your language setting in ChatGPT</article-title><source>OpenAI</source><access-date>2026-02-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://help.openai.com/en/articles/8357869-how-to-change-your-language-setting-in-chatgpt">https://help.openai.com/en/articles/8357869-how-to-change-your-language-setting-in-chatgpt</ext-link></comment></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moreno</surname><given-names>G de L</given-names> </name><name name-style="western"><surname>de Souza</surname><given-names>MPM</given-names> </name><name name-style="western"><surname>Hein</surname><given-names>N</given-names> </name><name name-style="western"><surname>Hein</surname><given-names>AK</given-names> </name></person-group><article-title>ALT: um software para an&#x00E1;lise de legibilidade de textos em l&#x00ED;ngua portuguesa [Article in Portuguese]</article-title><source>Policromias</source><year>2023</year><volume>8</volume><issue>1</issue><fpage>91</fpage><lpage>128</lpage><pub-id pub-id-type="doi">10.61358/policromias.v8i1.54352</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tiwary</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rimal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Paudyal</surname><given-names>B</given-names> </name><name name-style="western"><surname>Sigdel</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Basnyat</surname><given-names>B</given-names> </name></person-group><article-title>Poor communication by health care professionals may lead to life-threatening complications: examples from two case reports</article-title><source>Wellcome Open Res</source><year>2019</year><volume>4</volume><fpage>7</fpage><pub-id pub-id-type="doi">10.12688/wellcomeopenres.15042.1</pub-id><pub-id pub-id-type="medline">31448336</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boutemen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>AN</given-names> </name></person-group><article-title>Readability of publicly available mental health information: a systematic review</article-title><source>Patient Educ Couns</source><year>2023</year><month>06</month><volume>111</volume><fpage>107682</fpage><pub-id pub-id-type="doi">10.1016/j.pec.2023.107682</pub-id><pub-id pub-id-type="medline">36944285</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mendez</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Galvez</surname><given-names>SMN</given-names> </name><name name-style="western"><surname>Emmons</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Viswanath</surname><given-names>K</given-names> </name></person-group><article-title>Reading grade level estimates of public health communication on social media vary due to text preprocessing</article-title><source>J Health Commun</source><year>2025</year><volume>30</volume><issue>10-12</issue><fpage>634</fpage><lpage>640</lpage><pub-id pub-id-type="doi">10.1080/10810730.2025.2583460</pub-id><pub-id pub-id-type="medline">41204693</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eslami</surname><given-names>H</given-names> </name></person-group><article-title>The effect of syntactic simplicity and complexity on the readability of the text</article-title><source>JLTR</source><year>2014</year><month>09</month><day>1</day><volume>5</volume><issue>5</issue><fpage>1185</fpage><lpage>1191</lpage><pub-id pub-id-type="doi">10.4304/jltr.5.5.1185-1191</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mac</surname><given-names>O</given-names> </name><name name-style="western"><surname>Ayre</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bell</surname><given-names>K</given-names> </name><name name-style="western"><surname>McCaffery</surname><given-names>K</given-names> </name><name name-style="western"><surname>Muscat</surname><given-names>DM</given-names> </name></person-group><article-title>Comparison of readability scores for written health information across formulas using automated vs manual measures</article-title><source>JAMA Netw Open</source><year>2022</year><month>12</month><day>1</day><volume>5</volume><issue>12</issue><fpage>e2246051</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2022.46051</pub-id><pub-id pub-id-type="medline">36508219</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdulrazzaq</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Ramaha</surname><given-names>NTA</given-names> </name><name name-style="western"><surname>Hameed</surname><given-names>AA</given-names> </name><etal/></person-group><article-title>Consequential advancements of self-supervised learning (SSL) in deep learning contexts</article-title><source>Mathematics</source><year>2024</year><month>03</month><day>2</day><volume>12</volume><issue>5</issue><fpage>758</fpage><pub-id pub-id-type="doi">10.3390/math12050758</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>List of comments, and comparative accuracy and context stability evaluation table.</p><media xlink:href="infodemiology_v6i1e78843_app1.docx" xlink:title="DOCX File, 26 KB"/></supplementary-material></app-group></back></article>