<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="letter"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e101910</article-id><article-id pub-id-type="doi">10.2196/101910</article-id><article-categories><subj-group subj-group-type="heading"><subject>Letter to the Editor</subject></subj-group></article-categories><title-group><article-title>Beyond Visual Consensus: Tiered Reference Framework for AI Cystoscopy Studies</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Bayraktar</surname><given-names>Ahmet Murat</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>&#x0130;&#x015F;ler</surname><given-names>Bilgi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff id="aff1"><institution>Department of Urology, Konya City Hospital</institution><addr-line>Akabe Mah, Adana &#x00C7;evre Yolu Cad. No.135 Karatay</addr-line><addr-line>Konya</addr-line><country>Turkey</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Leung</surname><given-names>Tiffany</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Ahmet Murat Bayraktar, MD, Department of Urology, Konya City Hospital, Akabe Mah, Adana &#x00C7;evre Yolu Cad. No.135 Karatay, Konya, 42020, Turkey, 90 332310000 ext 21022; <email>drahmetbayraktar@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>18</day><month>6</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e101910</elocation-id><history><date date-type="received"><day>20</day><month>05</month><year>2026</year></date><date date-type="rev-recd"><day>22</day><month>05</month><year>2026</year></date><date date-type="accepted"><day>04</day><month>06</month><year>2026</year></date></history><copyright-statement>&#x00A9; Ahmet Murat Bayraktar, Bilgi &#x0130;&#x015F;ler. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 18.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e101910"/><related-article related-article-type="commentary article" ext-link-type="doi" xlink:href="10.2196/87193" xlink:title="Comment on" xlink:type="simple">https://www.jmir.org/2026/1/e87193</related-article><related-article related-article-type="commentary" ext-link-type="doi" xlink:href="10.2196/103335" xlink:title="Comment in" xlink:type="simple">https://www.jmir.org/2026/1/e103335</related-article><kwd-group><kwd>multimodal</kwd><kwd>large language model</kwd><kwd>AI</kwd><kwd>cystoscopy</kwd><kwd>diagnostic reasoning</kwd><kwd>finding description</kwd><kwd>biopsy indication</kwd><kwd>bladder tumor</kwd><kwd>artificial intelligence</kwd></kwd-group></article-meta></front><body><p>We read with great interest the study by Shih et al [<xref ref-type="bibr" rid="ref1">1</xref>], a valuable contribution to the emerging field of artificial intelligence (AI)&#x2013;assisted cystoscopic diagnosis. Their blinded evaluation of four multimodal large language models across 401 images encompassing 40 cystoscopic finding subcategories provides important insights into current model capabilities. We wish to raise a methodological consideration regarding the reference standard that may inform the interpretation of the reported findings.</p><p>The reference standard in this study was established through visual consensus between two urologists, without histopathological confirmation. While interexpert agreement was satisfactory (&#x03BA;=0.81), cystoscopic impression alone has well-documented limitations. Cina et al [<xref ref-type="bibr" rid="ref2">2</xref>] demonstrated that experienced urologists could not reliably distinguish between low- and high-grade papillary lesions endoscopically, with complete grade-stage concordance with histopathology in only 70.3% of cases and a specificity of just 57% for predicting lamina propria invasion. A visually derived reference standard thus carries inherent diagnostic uncertainty.</p><p>This concern is particularly relevant for lesion categories central to the study&#x2019;s 7-class task. Carcinoma in situ (CIS) is notoriously difficult to identify under white light cystoscopy; blue light cystoscopy studies have demonstrated that approximately one-third of CIS lesions are missed by white light alone [<xref ref-type="bibr" rid="ref3">3</xref>]. Similarly, the frequent misclassification of papilloma as papillary urothelial carcinoma&#x2014;acknowledged by the authors as reflecting substantial macroscopic overlap [<xref ref-type="bibr" rid="ref1">1</xref>]&#x2014;underscores that definitive classification of these entities requires histological evaluation of architectural and cytological features indistinguishable on endoscopic inspection.</p><p>The AI-assisted cystoscopic diagnosis literature has converged on histopathological confirmation as the reference standard. Foundational work such as CystoNet was trained and validated on histologically confirmed lesions [<xref ref-type="bibr" rid="ref4">4</xref>], and a recent systematic review by Hengky et al [<xref ref-type="bibr" rid="ref5">5</xref>] restricted inclusion to studies using histopathology as the reference standard. This consensus reflects the clinical reality that the categorical distinctions central to bladder lesion classification&#x2014;low- versus high-grade carcinoma, CIS versus inflammation, papilloma versus carcinoma&#x2014;ultimately rest on histological criteria and drive subsequent management.</p><p>We acknowledge the logistical challenges of obtaining histopathology for every image in a large, multisource dataset, particularly for benign-appearing or nonresected findings. We, therefore, suggest that future benchmarking studies adopt a tiered reference framework: (1) histopathologically confirmed labels for all lesions undergoing biopsy or resection, encompassing the full malignant spectrum; (2) enhanced cystoscopy correlation (blue light or narrow band imaging) as an intermediate standard, particularly for CIS [<xref ref-type="bibr" rid="ref3">3</xref>]; and (3) consensus visual labels&#x2014;explicitly flagged as lower confidence&#x2014;for benign categories unlikely to undergo biopsy in routine practice. Stratified performance reporting under such a framework would allow readers to separate genuine algorithmic limitations from ambiguity inherent to the reference standard, providing a more clinically meaningful evaluation.</p></body><back><ack><p>The authors acknowledge the use of generative artificial intelligence (Google Gemini) for language editing and proofreading assistance during the preparation of this manuscript.</p></ack><notes><sec><title>Funding</title><p>The authors declared no financial support was received for this work.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">CIS</term><def><p>carcinoma in situ</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shih</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Tsai</surname><given-names>CY</given-names> </name></person-group><article-title>Multimodal large language models for cystoscopic image interpretation and bladder lesion classification: comparative study</article-title><source>J Med Internet Res</source><year>2026</year><month>01</month><day>28</day><volume>28</volume><fpage>e87193</fpage><pub-id pub-id-type="doi">10.2196/87193</pub-id><pub-id pub-id-type="medline">41605505</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cina</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Epstein</surname><given-names>JI</given-names> </name><name name-style="western"><surname>Endrizzi</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Harmon</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Seay</surname><given-names>TM</given-names> </name><name name-style="western"><surname>Schoenberg</surname><given-names>MP</given-names> </name></person-group><article-title>Correlation of cystoscopic impression with histologic diagnosis of biopsy specimens of the bladder</article-title><source>Hum Pathol</source><year>2001</year><month>06</month><volume>32</volume><issue>6</issue><fpage>630</fpage><lpage>637</lpage><pub-id pub-id-type="doi">10.1053/hupa.2001.24999</pub-id><pub-id pub-id-type="medline">11431718</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grossman</surname><given-names>HB</given-names> </name><name name-style="western"><surname>Gomella</surname><given-names>L</given-names> </name><name name-style="western"><surname>Fradet</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>A phase III, multicenter comparison of hexaminolevulinate fluorescence cystoscopy and white light cystoscopy for the detection of superficial papillary lesions in patients with bladder cancer</article-title><source>J Urol</source><year>2007</year><month>07</month><volume>178</volume><issue>1</issue><fpage>62</fpage><lpage>67</lpage><pub-id pub-id-type="doi">10.1016/j.juro.2007.03.034</pub-id><pub-id pub-id-type="medline">17499283</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shkolyar</surname><given-names>E</given-names> </name><name name-style="western"><surname>Jia</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>TC</given-names> </name><etal/></person-group><article-title>Augmented bladder tumor detection using deep learning</article-title><source>Eur Urol</source><year>2019</year><month>12</month><volume>76</volume><issue>6</issue><fpage>714</fpage><lpage>718</lpage><pub-id pub-id-type="doi">10.1016/j.eururo.2019.08.032</pub-id><pub-id pub-id-type="medline">31537407</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hengky</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lionardi</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Kusumajaya</surname><given-names>C</given-names> </name></person-group><article-title>Can artificial intelligence aid the urologists in detecting bladder cancer?</article-title><source>Indian J Urol</source><year>2024</year><volume>40</volume><issue>4</issue><fpage>221</fpage><lpage>228</lpage><pub-id pub-id-type="doi">10.4103/iju.iju_39_24</pub-id><pub-id pub-id-type="medline">39555437</pub-id></nlm-citation></ref></ref-list></back></article>