<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i3e21695</article-id>
      <article-id pub-id-type="pmid">33764307</article-id>
      <article-id pub-id-type="doi">10.2196/21695</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Reducing the Impact of Confounding Factors on Skin Cancer Classification via Image Segmentation: Technical Model Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Cheng</surname>
            <given-names>Chi-Tung</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Frontoni</surname>
            <given-names>Emanuele</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Robinson</surname>
            <given-names>June</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Maron</surname>
            <given-names>Roman C</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2120-901X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Hekler</surname>
            <given-names>Achim</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4974-2457</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Krieghoff-Henning</surname>
            <given-names>Eva</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8381-3100</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Schmitt</surname>
            <given-names>Max</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5133-6768</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Schlager</surname>
            <given-names>Justin G</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8607-9367</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Utikal</surname>
            <given-names>Jochen S</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5316-0241</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Brinker</surname>
            <given-names>Titus J</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Digital Biomarkers for Oncology Group</institution>
            <institution>National Center for Tumor Diseases (NCT)</institution>
            <institution>German Cancer Research Center (DKFZ)</institution>
            <addr-line>Im Neuenheimer Feld 280</addr-line>
            <addr-line>Heidelberg, 69120</addr-line>
            <country>Germany</country>
            <phone>49 6221 3219304</phone>
            <email>titus.brinker@dkfz.de</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3620-5919</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Digital Biomarkers for Oncology Group</institution>
        <institution>National Center for Tumor Diseases (NCT)</institution>
        <institution>German Cancer Research Center (DKFZ)</institution>
        <addr-line>Heidelberg</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Dermatology and Allergy</institution>
        <institution>University Hospital</institution>
        <institution>LMU Munich</institution>
        <addr-line>Munich</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Dermatology</institution>
        <institution>Heidelberg University</institution>
        <addr-line>Mannheim</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Skin Cancer Unit</institution>
        <institution>German Cancer Research Center (DKFZ)</institution>
        <addr-line>Heidelberg</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Titus J Brinker <email>titus.brinker@dkfz.de</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>3</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>25</day>
        <month>3</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>3</issue>
      <elocation-id>e21695</elocation-id>
      <history>
        <date date-type="received">
          <day>22</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>28</day>
          <month>10</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>13</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>8</day>
          <month>2</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Roman C Maron, Achim Hekler, Eva Krieghoff-Henning, Max Schmitt, Justin G Schlager, Jochen S Utikal, Titus J Brinker. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 25.03.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/3/e21695" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Studies have shown that artificial intelligence achieves similar or better performance than dermatologists in specific dermoscopic image classification tasks. However, artificial intelligence is susceptible to the influence of confounding factors within images (eg, skin markings), which can lead to false diagnoses of cancerous skin lesions. Image segmentation can remove lesion-adjacent confounding factors but greatly change the image representation.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to compare the performance of 2 image classification workflows where images were either segmented or left unprocessed before the subsequent training and evaluation of a binary skin lesion classifier.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Separate binary skin lesion classifiers (nevus vs melanoma) were trained and evaluated on segmented and unsegmented dermoscopic images. For a more informative result, separate classifiers were trained on 2 distinct training data sets (human against machine [HAM] and International Skin Imaging Collaboration [ISIC]). Each training run was repeated 5 times. The mean performance of the 5 runs was evaluated on a multi-source test set (n=688) consisting of a holdout and an external component.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our findings showed that when trained on HAM, the segmented classifiers showed a higher overall balanced accuracy (75.6% [SD 1.1%]) than the unsegmented classifiers (66.7% [SD 3.2%]), which was significant in 4 out of 5 runs (<italic>P</italic>&#60;.001). The overall balanced accuracy was numerically higher for the unsegmented ISIC classifiers (78.3% [SD 1.8%]) than for the segmented ISIC classifiers (77.4% [SD 1.5%]), which was significantly different in 1 out of 5 runs (<italic>P</italic>=.004).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Image segmentation does not result in overall performance decrease but it causes the beneficial removal of lesion-adjacent confounding factors. Thus, it is a viable option to address the negative impact that confounding factors have on deep learning models in dermatology. However, the segmentation step might introduce new pitfalls, which require further investigations.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>dermatology</kwd>
        <kwd>diagnosis</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>neural networks</kwd>
        <kwd>image segmentation</kwd>
        <kwd>confounding factors</kwd>
        <kwd>artifacts</kwd>
        <kwd>melanoma</kwd>
        <kwd>nevus</kwd>
        <kwd>deep learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Deep learning models have achieved impressive results in dermoscopic image skin cancer classification, as exemplified by a range of studies on binary and multiclass classification tasks [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. The creation of open-source dermoscopic image databases [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>] has enabled much of the current research in this area by facilitating the training and evaluation of deep learning models. Supervised learning is commonly used, where the deep learning model is trained on labeled training data (eg, dermoscopic image plus its corresponding diagnosis), and it continually optimizes its internal parameters. This produces an inferred function that ideally classifies previously unseen data correctly based on a valid strategy (eg, in the case of skin lesions, based on relevant biological and structural features). However, it is not uncommon for deep learning models to learn spurious correlations within the training data. As a result, these models fail when evaluating data not exhibiting the respective correlations. In image analysis, such correlations are often introduced by visual artifacts, which act as confounding factors and have been observed to result in performance degradation [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. A recent dermatology study showed that skin markings significantly interfered with the correct diagnosis of nevi by deep learning convolutional neural networks (CNNs) by increasing the melanoma probability scores and consequently, the false-positive rate [<xref ref-type="bibr" rid="ref11">11</xref>]. Besides skin markings with stains/ink, a variety of artifacts are encountered in public and proprietary dermoscopic image databases, such as dark image corners, gel bubbles, color charts, ruler marks, or skin hairs (see <xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
      <p>A variety of strategies have been proposed to tackle confounding factors such as digital hair removal, image cropping, or image segmentation [<xref ref-type="bibr" rid="ref12">12</xref>]. In image segmentation, an image is partitioned into 2 or more regions so that each region can be analyzed on its own. Dermoscopic image segmentation usually partitions the image into foreground (lesion) and background (surrounding skin, see <xref rid="figure1" ref-type="fig">Figure 1</xref>). This preprocessing approach has the advantage that it not only simplifies the representation of the image but also removes the surrounding artifacts. Theoretically, the image fed to the deep learning model after segmentation consists mainly of the lesion, which presumably contains the most information but the least confounding factors.</p>
      <p>In this study, we therefore determined if and how image segmentation affects skin lesion classification performance of deep learning–based algorithms. We compared the performance of 2 workflows: one where skin lesion classifiers were trained by a traditional end-to-end approach on unsegmented dermoscopic images and one where classifiers were trained by a two-step approach on images that have undergone prior segmentation.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Typical artifacts encountered in dermoscopic image databases. Panels A-D show an exemplary range of artifacts often found in dermoscopic images, which are (left to right) color charts and hair, text, ruler markings, and marker ink. Panels E-H show how a corresponding segmented image could look like, with the surrounding artifacts removed but artifacts within the lesion (Panel E) still visible.</p>
        </caption>
        <graphic xlink:href="jmir_v23i3e21695_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>Binary classifiers (nevus vs melanoma) were trained on 2 different data sets and on unsegmented or segmented images, respectively, resulting in 4 separate types of classifiers. All classifiers were evaluated on a test set (n=688) consisting of 1 holdout component (n=200) and 3 external components (n=488). For each classifier type, 5 training and testing runs were performed in order to obtain robust performance estimates, which encompass the stochastic nature of the training process (see <xref rid="figure2" ref-type="fig">Figure 2</xref>). Ethics approval was waived by the ethics committee of the University of Heidelberg, as images were open source and anonymous.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Flowchart of the study design. A training data set consisting of images from 2 different sources was either segmented or not segmented and split into 2 smaller partitions based on image origin (HAM or ISIC). An individual classifier was then trained on each of the 4 training sets and evaluated on a multi-source test set, which underwent a preprocessing step that equaled the training data preprocessing. Training and evaluation were repeated a total of 5 times for a more robust measure. HAM: human against machine data set; ISIC: international skin imaging collaboration data set; PH2: hospital Pedro Hispano data set; PROP: proprietary data set.</p>
          </caption>
          <graphic xlink:href="jmir_v23i3e21695_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Sets</title>
        <p>Dermoscopic images for developing the segmentation model were obtained from task 1 of the International Skin Imaging Collaboration (ISIC) 2018 challenge [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. This data set is already split into a training, validation, and test set by the challenge organizers and contains dermoscopic lesion images together with a binary image mask, which partitions the image into a background (areas outside the primary lesion) and foreground (areas inside the primary lesion). This mask represents the “ground truth” with respect to the correct partitioning of the images. Dermoscopic images for developing the skin lesion classifiers were obtained from 2 sources: from part 3 of the ISIC 2017 challenge [<xref ref-type="bibr" rid="ref6">6</xref>] and from the human against machine (HAM) data set [<xref ref-type="bibr" rid="ref7">7</xref>]. Both data sets are mutually exclusive, with the HAM data set showing considerably fewer artifacts than the ISIC data set. Duplicated images within the HAM data set were removed prior to splitting the data set into the training, validation, and test set. The ISIC 2017 challenge data set had already been split by the challenge organizers.</p>
        <p>Two additional external data sets were used for classifier evaluation. The first data set is publicly available and contains dermoscopic images acquired at the Dermatology Service of Hospital Pedro Hispano (PH2), Matosinhos, Portugal [<xref ref-type="bibr" rid="ref8">8</xref>]. The second data set is proprietary (PROP) and contains dermoscopic images acquired from the Department of Dermatology and Allergy, University Hospital, LMU Munich, Munich and from the Department of Dermatology, Heidelberg University, Mannheim. Both data sets also contain some of the artifacts observed in ISIC and HAM, such as black image corners, rulers, or skin markings. As PH2 also contains binary image masks from dermatologists, this data set was also used for the evaluation of the segmentation model. Details on the training, validation, and test set composition are listed in Table S1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Segmentation Model and Classifier Development</title>
        <p>For image segmentation, a CNN in the form of a U-Net was employed [<xref ref-type="bibr" rid="ref14">14</xref>]. The model’s raw output, which consists of a binary image mask, was further automatically processed by removing noise, closing holes, and replacing empty masks. Skin lesion classifiers were generated using a ResNet50 architecture, which was pretrained on ImageNet. For details on segmentation model and classifier development, refer to the supplementary methods (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      </sec>
      <sec>
        <title>Analysis</title>
        <p>The segmentation model’s performance was evaluated using a thresholded mean Jaccard index, a score between 0 and 1, which measures the similarity between the ground truth mask and the model’s output mask. The threshold was based on the ISIC 2018 challenge and set to 0.65, meaning that any lower scores were set to 0. The performance for each individual classifier was measured using balanced accuracy as the primary endpoint, with sensitivity, specificity, and area under the receiver operating characteristic curve (AUROC) as secondary endpoints. As we repeated each classifier training and evaluation step 5 times, metrics were first computed for each individual classifier and then averaged to obtain a mean performance measure. Performance comparisons were carried out between the preprocessing methods (ie, segmented vs unsegmented) and not between the underlying training data sets (ie, not HAM vs ISIC). Thus, we compared HAM segmented to HAM unsegmented and ISIC segmented to ISIC unsegmented but not HAM segmented to ISIC segmented. Statistical significance was evaluated for the primary endpoint by using a two-sided McNemar test and considered significant at <italic>P</italic>&#60;.005 (Bonferroni correction by a factor of 10) to account for multiple testing when comparing the individual segmented HAM/ISIC classifiers to unsegmented HAM/ISIC classifiers for each of the 5 runs (one-on-one comparison). <italic>P</italic> values are listed only for significant runs.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Segmentation Model Performance</title>
        <p>The thresholded Jaccard index on the ISIC holdout test set for the segmentation model after mask postprocessing was 0.75 and increased to 0.81 on the external PH2 set.</p>
      </sec>
      <sec>
        <title>Classifier Performance</title>
        <p>The overall balanced accuracy was numerically higher for the unsegmented ISIC classifiers (78.3% [SD 1.8%]) than for the segmented ISIC classifiers (77.4% [SD 1.5%]). This was significantly different in 1 out of 5 runs (<italic>P</italic>=.004). When trained on HAM, the segmented classifiers showed a higher overall balanced accuracy (75.6% [SD 1.1%]) than the unsegmented classifiers (66.7% [SD 3.2%]). This difference was significant for 4 out of the 5 classifiers (<italic>P</italic>&#60;.001). A subanalysis of the performance on the holdout and external test set component shows that segmented classifiers had a numerically higher overall balanced accuracy on the external component than unsegmented classifiers, regardless of the data set source (see <xref ref-type="table" rid="table1">Table 1</xref>). The reverse trend was observed for the holdout component. AUROC followed the same trends as mean balanced accuracy.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>
            Overview of the balanced accuracy and area under the receiver operating characteristic curve for each type of classifier across the holdout, external, and overall test set.
            
            </p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="290"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td rowspan="2" colspan="2">Test set components, metric</td>
                <td colspan="6">Trained classifiers</td>
              </tr>
              <tr valign="bottom">
                <td colspan="2">HAM<sup>a</sup> segmented (%)</td>
                <td colspan="2">HAM unsegmented (%)</td>
                <td>ISIC<sup>b</sup> segmented (%)</td>
                <td>ISIC unsegmented (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>Holdout</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Balanced accuracy, mean (SD)</td>
                <td colspan="2">87.6 (1.4)</td>
                <td>
                  <italic>89.4 (0.9)</italic>
                  <sup>c</sup>
                </td>
                <td>77.1 (1.5)</td>
                <td>
                  <italic>80.0 (2.6)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">AUROC<sup>d</sup>, mean (SD)</td>
                <td colspan="2">0.95 (0.006)</td>
                <td>
                  <italic>0.964 (0.002)</italic>
                </td>
                <td>0.839 (0.008)</td>
                <td>
                  <italic>0.89 (0.1)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>External</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Balanced accuracy, mean (SD)</td>
                <td colspan="2">
                  <italic>69.9 (1.3)</italic>
                </td>
                <td>57.6 (4.1)</td>
                <td>
                  <italic>78.2 (1.6)</italic>
                </td>
                <td>77.6 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">AUROC, mean (SD)</td>
                <td colspan="2">
                  <italic>0.765 (0.011)</italic>
                </td>
                <td>0.647 (0.025)</td>
                <td>
                  <italic>0.874 (0.005)</italic>
                </td>
                <td>0.851 (0.018)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Overall</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Balanced accuracy, mean (SD)</td>
                <td colspan="2">
                  <italic>75.6 (1.1)</italic>
                </td>
                <td>66.7 (3.2)</td>
                <td>77.4 (1.5)</td>
                <td>
                  <italic>78.3 (1.8)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">AUROC, mean (SD)</td>
                <td colspan="2">
                  <italic>0.841 (0.008)</italic>
                </td>
                <td>0.763 (0.02)</td>
                <td>0.856 (0.005)</td>
                <td>
                  <italic>0.862 (0.014)</italic>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>HAM: human against machine data set.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>ISIC: International Skin Imaging Collaboration data set.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>The italicized data indicate the higher metric when comparing between classifiers trained on a segmented/unsegmented version of the same data set.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>ISIC classifiers (regardless of preprocessing) show a comparable balanced accuracy across the holdout and external test set components, resulting in a similar balanced accuracy for the overall test set. In contrast, the segmented HAM classifiers show a substantially higher overall balanced accuracy to the unsegmented HAM classifiers. This better overall balanced accuracy stems from a visible performance difference on the external test set component, which is largely driven by a drop in the balanced accuracy for PH2. Here, the balanced accuracy of unsegmented HAM classifiers was 63.2% (SD 7.1%) compared to 84.4% (SD 2.9%) for the segmented HAM classifiers (see <xref ref-type="table" rid="table2">Table 2</xref>). Equivalent tables showing the results for the metric sensitivity and specificity are found in Table S2 and Table S3 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>
            Overview of the balanced accuracy and area under the receiver operating characteristic curve for each type of classifier across the external test set’s 3 individual components.
            
            </p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="290"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td rowspan="2" colspan="3">External test set components, metric</td>
                <td colspan="7">Trained classifiers</td>
              </tr>
              <tr valign="bottom">
                <td colspan="2">HAM<sup>a</sup> segmented (%)</td>
                <td colspan="2">HAM unsegmented (%)</td>
                <td colspan="2">ISIC<sup>b</sup> segmented (%)</td>
                <td>ISIC unsegmented (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="10">
                  <bold>HAM/ISIC<sup>c</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Balanced accuracy, mean (SD)</td>
                <td colspan="2">
                  <italic>61.0 (1.3)</italic>
                  <sup>d</sup>
                </td>
                <td colspan="2">58.9 (3.1)</td>
                <td colspan="2">74.1 (3.6)</td>
                <td colspan="2">
                  <italic>76.5 (1.8)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AUROC<sup>e</sup>, mean (SD)</td>
                <td colspan="2">0.628 (0.005)</td>
                <td colspan="2">
                  <italic>0.636 (0.023)</italic>
                </td>
                <td colspan="2">0.827 (0.019)</td>
                <td colspan="2">
                  <italic>0.851 (0.022)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>PH2<sup>f</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Balanced accuracy, mean (SD)</td>
                <td colspan="2">
                  <italic>84.4 (2.9)</italic>
                </td>
                <td colspan="2">63.2 (7.1)</td>
                <td colspan="2">
                  <italic>86.4 (1.3)</italic>
                </td>
                <td colspan="2">83.7 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AUROC, mean (SD)</td>
                <td colspan="2">
                  <italic>0.928 (0.022)</italic>
                </td>
                <td colspan="2">0.894 (0.021)</td>
                <td colspan="2">
                  <italic>0.947 (0.007)</italic>
                </td>
                <td colspan="2">0.912 (0.018)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>PROP<sup>g</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Balanced accuracy, mean (SD)</td>
                <td colspan="2">71.1 (1.8)</td>
                <td colspan="2">
                  <italic>75.7 (4.2)</italic>
                </td>
                <td colspan="2">68.7 (1.6)</td>
                <td colspan="2">
                  <italic>74.6 (2.8)</italic>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AUROC, mean (SD)</td>
                <td colspan="2">0.825 (0.033)</td>
                <td colspan="2">
                  <italic>0.857 (0.034)</italic>
                </td>
                <td colspan="2">
                  <italic>0.88 (0.025)</italic>
                </td>
                <td colspan="2">0.814 (0.015)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>HAM: human against machine data set.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>ISIC: International Skin Imaging Collaboration data set.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>If classifiers were trained on HAM images, the first external test set component consists of ISIC and vice versa.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>The italicized data indicate the higher metric when comparing between classifiers trained on a segmented/unsegmented version of the same data set.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>PH2: hospital Pedro Hispano data set.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>PROP: proprietary data set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Additional Analyses</title>
        <p>Some additional analyses were carried out based on the obtained results. As the unsegmented HAM classifiers showed poor performance on PH2 with high sensitivity (95.5% [SD 1.9%]) but low specificity (30.9% [SD 13.6%], Table S3 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), their performance was again evaluated on cropped unsegmented PH2 images. As the PH2 data set consists of images with predominantly black corners (see <xref rid="figure3" ref-type="fig">Figure 3</xref>), we speculated that these could be artifacts, which caused the drop in performance. We therefore manually cropped all unsegmented PH2 images just enough so that any black corner was removed. On cropped PH2 images, specificity increased to 65.8% (SD 8.3%) at almost unchanged sensitivity of 93.5% (SD 3%), resulting in an overall mean balanced accuracy of 79.6% (SD 3.8%). As the unsegmented ISIC classifiers showed a comparable performance to the segmented ISIC classifiers, there was no reason to assume that these classifiers are also negatively influenced by black image corners. However, when its performance was evaluated on cropped PH2, sensitivity decreased from 82% (SD 2.9%) (unsegmented) to 67.5% (SD 5.7%) (cropped) with specificity increasing from 85.4% (SD 2.8%) to 89.4% (SD 1.7%), resulting in a change of mean balanced accuracy from 83.7% (SD 0.8%) to 78.4% (SD 3.6%).</p>
        <p>As ground truth segmentation masks were available for the PH2 data set, PH2 images were experimentally segmented using these masks instead of the masks produced by the segmentation model and subsequently used for evaluation. These masks were produced by an expert dermatologist; therefore, a similar performance was expected. However, segmented HAM and ISIC classifiers showed a lower balanced accuracy for PH2 images when processed by the ground truth masks (82% [SD 2.2%] and 76.1% [SD 2.9%], respectively) as opposed to the segmentation model mask (84.4% [SD 2.9%] and 86.4% [SD 1.3%], respectively). This change resulted from a drop in specificity from 80.2% (SD 3.8%) and 82.4% (SD 5.0%) to 76.5% (SD 5.6%) and 63.2% (SD 9.7%) at almost constant sensitivity (88.5% [SD 5.1%] and 90.5% [SD 3.7%] vs 87.5% [SD 5.0%] and 89.0% [SD 5.1%], respectively).</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Exemplary predictions of a classifier trained on unsegmented HAM (left) and ISIC (right) images and evaluated on unsegmented and cropped PH2 images. The target class (ground truth) for each lesion is displayed to the left, with the classifier’s output probability for the target class on top. An output probability larger than 50% corresponds to a correct classification, which is also indicated by a blue frame, whereas an orange frame denotes an incorrect classification. HAM: human against machine data set; ISIC: international skin imaging collaboration data set; PH2: hospital Pedro Hispano data set.</p>
          </caption>
          <graphic xlink:href="jmir_v23i3e21695_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Overview of the Study</title>
        <p>In this study, we established and compared the performance of 2 classification workflows. The first workflow did not include a preprocessing step, and training and test set images were unmodified. The second included preprocessing where images were segmented prior to classifier training and evaluation. For training, we used 2 distinct training data sets (HAM and ISIC) and established the performance on a multi-source test set. Our findings show that while performance is highly dependent on the source of the training and test set, segmentation does not lead to an overall decrease in the performance of a ResNet50 architecture and may even lead to an improved classifier, which is presumably at a decreased risk to suffer from common lesion-adjacent confounding factors.</p>
      </sec>
      <sec>
        <title>Principal Results</title>
        <p>The overall comparable performance of classifiers trained on segmented and unsegmented images shows that classifiers are able to distinguish melanoma from nevus images based largely on the lesion itself without requiring the surrounding skin area for additional information. This is not unexpected as visual inspection by dermatologists also mainly focuses on global and local features within the lesion, although features such as increased vascularization of the surrounding skin and lesions on sun-damaged or aged skin are associated with a higher risk of skin cancer and can thus be used as cues. While segmentation requires an extra step compared to end-to-end classification, it may be worthwhile as proper segmentation removes potential preexisting confounding factors surrounding the lesion (albeit not within the lesion, eg, hairs, overlapping rulers). Given the prevalence and large variety of artifacts in public dermoscopic databases such as ISIC, such measures are warranted to counteract the possibility of the classifier incorporating confounding factors in its decision process. For example, gentian violet skin markers were previously shown to be associated with a higher melanoma probability by a CNN approved for use as a medical device in the European market [<xref ref-type="bibr" rid="ref11">11</xref>]. As artifact perception by a CNN-based classifier is dependent on the constitution of the underlying training data, this finding is not necessarily applicable to other CNN-based classifiers but highlights the negative impact of artifacts that may manifest themselves in a variety of ways. In this study, we hypothesize that classifiers trained on unsegmented HAM and ISIC images correlate black image corners with the occurrence of melanoma, albeit to varying degrees. Both unsegmented classifiers were evaluated on unsegmented and cropped PH2 images, where cropping completely removed the black corners (see <xref rid="figure3" ref-type="fig">Figure 3</xref>). In both cases, specificity increased when using cropped PH2 images. Sensitivity remained almost unchanged for the HAM classifiers and decreased for the ISIC classifiers, suggesting that classifiers trained on either training set associate black image corners with melanoma, but weigh its importance differently. Alternatively, it cannot be ruled out that the observed performance change stems from the cropping process, which introduces resolution changes, image distortions, and the removal of potentially relevant biological information if parts of the lesion are cropped out. However, given the one-sided performance increase (ie, for specificity) for classifiers from both data sets and the large prevalence of black image corners in the HAM and ISIC training data, a correlation is not unlikely.</p>
        <p>As the segmentation step lies upstream of the classifier training and evaluation steps, the latter two are highly dependent on the output quality of the former. While the model employed in this study achieved a threshold Jaccard index lower than the score obtained by the ISIC 2018 challenge winners (0.75 vs 0.80), a general visual inspection of the segmentation masks suggested sufficient quality (ie, lesions visible with large portions of the background adequately removed). Further evaluation of its performance on an external data set (PH2) indicated that the segmentation model generalizes well and can be employed for segmenting images from external data sets. Assuming that classifier performance is partially indicative of segmentation performance, the segmentation model generalized adequately for HAM and PH2 images (known of course for the latter already due to the ground truth masks, but confirmed here again). In contrast, classifiers trained on segmented images performed worse on PROP with low mean balanced accuracies. Given that classifiers trained on unsegmented images did not suffer from this issue, insufficient segmentation masks are a possible candidate for the problem. This is, however, difficult to verify due to the nonexisting ground truth masks. This illustrates that the performance of segmented classifiers is ultimately tied to the performance of the segmentation model.</p>
        <p>In practice, identifying and fixing obviously faulty segmentation masks manually at test time should be feasible but may not be sufficient. As seen for the analysis of the PH2 set, where model segmentation masks were compared to ground truth segmentation masks, classifier performance may be strongly influenced by the precise way that the segmentation is done, with small differences causing large negative effects (see <xref rid="figure4" ref-type="fig">Figure 4</xref>). Training sets of automatically segmented images could contain their own kind of artifacts introduced by the automated segmentation process. We speculate that masks produced by the segmentation model have distinctive visual characteristics based on its training set and postprocessing methods. For instance, a certain amount of the adjacent skin may be included or the segmentation creates unique borders (eg, smoothness of edges). Any classifier trained on images with such segmentation masks might pick up on such subtleties and become susceptible to segmentation masks of a different variety.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Exemplary predictions of a classifier trained on unsegmented HAM (left) and ISIC (right) images and evaluated on PH2 images with different segmentation masks. PH2 images in the SM column were segmented using the segmentation model. PH2 images in the GT column were segmented using dermatologist-generated ground truth segmentation masks. The target class (ground truth) for each lesion is displayed to the left, with the classifier’s output probability for the target class on top. An output probability larger than 50% corresponds to a correct classification, which is also indicated by a blue frame, whereas an orange frame denotes an incorrect classification. GT: ground truth; HAM: human against machine data set; ISIC: international skin imaging collaboration data set; PH2: hospital Pedro Hispano data set; SM: segmentation model.</p>
          </caption>
          <graphic xlink:href="jmir_v23i3e21695_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Future Work and Limitations</title>
        <p>While the study aimed at only comparing the performance of 2 classification workflows where classifiers were trained on segmented/unsegmented images, there is notable performance variation dependent on the training and test sets. While the HAM training set contained more unique melanoma lesions (514 vs 374, Table S1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), the ISIC training data set contained more images of biopsy-verified lesions and thus, probably more borderline cases. These distinct features may be advantageous or detrimental for classifier performance on any given test set. Future work should address the issue of faulty segmentation masks and closely investigate the potential artifacts arising from an upstream segmentation step. As classification was done in a binary instead of a multi-class setting due to limited data availability, these findings might not generalize to a multi-class setting. Furthermore, performance was only shown here for 1 architecture; thus, generalizability to similar architectures, while expected, is not guaranteed.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Skin lesion classifiers trained and evaluated on segmented images have an overall comparable performance to classifiers trained and evaluated on unsegmented images that show the exact same lesion. In addition, segmentation comes with the added benefit of removing lesion-adjacent artifacts, which may act as confounding factors. However, this benefit comes at a cost, as classifier performance is tied to the segmentation quality. Further, image segmentation may introduce new pitfalls. Hence, further investigation is required to elucidate the effects of segmentation observed in this study.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary content.</p>
        <media xlink:href="jmir_v23i3e21695_app1.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HAM</term>
          <def>
            <p>human against machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ISIC</term>
          <def>
            <p>International Skin Imaging Collaboration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PH2</term>
          <def>
            <p>hospital Pedro Hispano</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PROP</term>
          <def>
            <p>proprietary data set</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by the Federal Ministry of Health, Berlin, Germany (grant: Skin Classification Project; grant holder: Titus J. Brinker, MD, German Cancer Research Center, Heidelberg, Germany). The sponsor had no role in the design and conduct of the study; collection, management, analysis, and interpretation of the data; preparation, review, or approval of the manuscript; and decision to submit the manuscript for publication.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>TJB reports owning a company that develops mobile apps (Smart Health Heidelberg GmbH, Handschuhsheimer Landstr. 9/1, 69120 Heidelberg). JSU is on the advisory board or has received honoraria and travel support from Amgen, Bristol Myers Squibb, GSK, LeoPharma, Merck Sharp and Dohme, Novartis, Pierre Fabre, Roche, outside the submitted work. No other disclosures were reported.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Esteva</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kuprel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Novoa</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Swetter</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Blau</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Thrun</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Dermatologist-level classification of skin cancer with deep neural networks</article-title>
          <source>Nature</source>
          <year>2017</year>
          <month>01</month>
          <day>25</day>
          <volume>542</volume>
          <issue>7639</issue>
          <fpage>115</fpage>
          <lpage>118</lpage>
          <pub-id pub-id-type="doi">10.1038/nature21056</pub-id>
          <pub-id pub-id-type="medline">28117445</pub-id>
          <pub-id pub-id-type="pii">nature21056</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haenssle</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Fink</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schneiderbauer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Toberer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Buhl</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kalloo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hassen</surname>
              <given-names>ABH</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Enk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Uhlmann</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Alt</surname>
              <given-names>Christina</given-names>
            </name>
            <name name-style="western">
              <surname>Arenbergerova</surname>
              <given-names>Monika</given-names>
            </name>
            <collab>Reader study level-I and level-II Groups</collab>
            <name name-style="western">
              <surname>Bakos</surname>
              <given-names>Renato</given-names>
            </name>
            <name name-style="western">
              <surname>Baltzer</surname>
              <given-names>Anne</given-names>
            </name>
            <name name-style="western">
              <surname>Bertlich</surname>
              <given-names>Ines</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>Andreas</given-names>
            </name>
            <name name-style="western">
              <surname>Bokor-Billmann</surname>
              <given-names>Therezia</given-names>
            </name>
            <name name-style="western">
              <surname>Bowling</surname>
              <given-names>Jonathan</given-names>
            </name>
            <name name-style="western">
              <surname>Braghiroli</surname>
              <given-names>Naira</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>Ralph</given-names>
            </name>
            <name name-style="western">
              <surname>Buder-Bakhaya</surname>
              <given-names>Kristina</given-names>
            </name>
            <name name-style="western">
              <surname>Buhl</surname>
              <given-names>Timo</given-names>
            </name>
            <name name-style="western">
              <surname>Cabo</surname>
              <given-names>Horacio</given-names>
            </name>
            <name name-style="western">
              <surname>Cabrijan</surname>
              <given-names>Leo</given-names>
            </name>
            <name name-style="western">
              <surname>Cevic</surname>
              <given-names>Naciye</given-names>
            </name>
            <name name-style="western">
              <surname>Classen</surname>
              <given-names>Anna</given-names>
            </name>
            <name name-style="western">
              <surname>Deltgen</surname>
              <given-names>David</given-names>
            </name>
            <name name-style="western">
              <surname>Fink</surname>
              <given-names>Christine</given-names>
            </name>
            <name name-style="western">
              <surname>Georgieva</surname>
              <given-names>Ivelina</given-names>
            </name>
            <name name-style="western">
              <surname>Hakim-Meibodi</surname>
              <given-names>Lara-Elena</given-names>
            </name>
            <name name-style="western">
              <surname>Hanner</surname>
              <given-names>Susanne</given-names>
            </name>
            <name name-style="western">
              <surname>Hartmann</surname>
              <given-names>Franziska</given-names>
            </name>
            <name name-style="western">
              <surname>Hartmann</surname>
              <given-names>Julia</given-names>
            </name>
            <name name-style="western">
              <surname>Haus</surname>
              <given-names>Georg</given-names>
            </name>
            <name name-style="western">
              <surname>Hoxha</surname>
              <given-names>Elti</given-names>
            </name>
            <name name-style="western">
              <surname>Karls</surname>
              <given-names>Raimonds</given-names>
            </name>
            <name name-style="western">
              <surname>Koga</surname>
              <given-names>Hiroshi</given-names>
            </name>
            <name name-style="western">
              <surname>Kreusch</surname>
              <given-names>Jürgen</given-names>
            </name>
            <name name-style="western">
              <surname>Lallas</surname>
              <given-names>Aimilios</given-names>
            </name>
            <name name-style="western">
              <surname>Majenka</surname>
              <given-names>Pawel</given-names>
            </name>
            <name name-style="western">
              <surname>Marghoob</surname>
              <given-names>Ash</given-names>
            </name>
            <name name-style="western">
              <surname>Massone</surname>
              <given-names>Cesare</given-names>
            </name>
            <name name-style="western">
              <surname>Mekokishvili</surname>
              <given-names>Lali</given-names>
            </name>
            <name name-style="western">
              <surname>Mestel</surname>
              <given-names>Dominik</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>Volker</given-names>
            </name>
            <name name-style="western">
              <surname>Neuberger</surname>
              <given-names>Anna</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>Kari</given-names>
            </name>
            <name name-style="western">
              <surname>Oliviero</surname>
              <given-names>Margaret</given-names>
            </name>
            <name name-style="western">
              <surname>Pampena</surname>
              <given-names>Riccardo</given-names>
            </name>
            <name name-style="western">
              <surname>Paoli</surname>
              <given-names>John</given-names>
            </name>
            <name name-style="western">
              <surname>Pawlik</surname>
              <given-names>Erika</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>Barbar</given-names>
            </name>
            <name name-style="western">
              <surname>Rendon</surname>
              <given-names>Adriana</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>Teresa</given-names>
            </name>
            <name name-style="western">
              <surname>Sadek</surname>
              <given-names>Ahmed</given-names>
            </name>
            <name name-style="western">
              <surname>Samhaber</surname>
              <given-names>Kinga</given-names>
            </name>
            <name name-style="western">
              <surname>Schneiderbauer</surname>
              <given-names>Roland</given-names>
            </name>
            <name name-style="western">
              <surname>Schweizer</surname>
              <given-names>Anissa</given-names>
            </name>
            <name name-style="western">
              <surname>Toberer</surname>
              <given-names>Ferdinand</given-names>
            </name>
            <name name-style="western">
              <surname>Trennheuser</surname>
              <given-names>Lukas</given-names>
            </name>
            <name name-style="western">
              <surname>Vlahova</surname>
              <given-names>Lyobomira</given-names>
            </name>
            <name name-style="western">
              <surname>Wald</surname>
              <given-names>Alexander</given-names>
            </name>
            <name name-style="western">
              <surname>Winkler</surname>
              <given-names>Julia</given-names>
            </name>
            <name name-style="western">
              <surname>Wölbing</surname>
              <given-names>Priscila</given-names>
            </name>
            <name name-style="western">
              <surname>Zalaudek</surname>
              <given-names>Iris</given-names>
            </name>
          </person-group>
          <article-title>Man against machine: diagnostic performance of a deep learning convolutional neural network for dermoscopic melanoma recognition in comparison to 58 dermatologists</article-title>
          <source>Ann Oncol</source>
          <year>2018</year>
          <month>08</month>
          <day>01</day>
          <volume>29</volume>
          <issue>8</issue>
          <fpage>1836</fpage>
          <lpage>1842</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0923-7534(19)34105-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/annonc/mdy166</pub-id>
          <pub-id pub-id-type="medline">29846502</pub-id>
          <pub-id pub-id-type="pii">S0923-7534(19)34105-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tschandl</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rosendahl</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Akay</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Argenziano</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Cabo</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gourhant</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kreusch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lallas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lapins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Marghoob</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Menzies</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Neuber</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Paoli</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rabinovitz</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Rinner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scope</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Soyer</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Sinz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zalaudek</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kittler</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Expert-Level Diagnosis of Nonpigmented Skin Cancer by Combined Convolutional Neural Networks</article-title>
          <source>JAMA Dermatol</source>
          <year>2019</year>
          <month>01</month>
          <day>01</day>
          <volume>155</volume>
          <issue>1</issue>
          <fpage>58</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30484822"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamadermatol.2018.4378</pub-id>
          <pub-id pub-id-type="medline">30484822</pub-id>
          <pub-id pub-id-type="pii">2716294</pub-id>
          <pub-id pub-id-type="pmcid">PMC6439580</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brinker</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hekler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Enk</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Berking</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Haferkamp</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hauschild</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weichenthal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Klode</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schadendorf</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Holland-Letz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>von Kalle</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fröhling</surname>
              <given-names>Stefan</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Utikal</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Deep neural networks are superior to dermatologists in melanoma image classification</article-title>
          <source>Eur J Cancer</source>
          <year>2019</year>
          <month>09</month>
          <volume>119</volume>
          <fpage>11</fpage>
          <lpage>17</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0959-8049(19)30349-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejca.2019.05.023</pub-id>
          <pub-id pub-id-type="medline">31401469</pub-id>
          <pub-id pub-id-type="pii">S0959-8049(19)30349-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>Roman C</given-names>
            </name>
            <name name-style="western">
              <surname>Weichenthal</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Utikal</surname>
              <given-names>Jochen S</given-names>
            </name>
            <name name-style="western">
              <surname>Hekler</surname>
              <given-names>Achim</given-names>
            </name>
            <name name-style="western">
              <surname>Berking</surname>
              <given-names>Carola</given-names>
            </name>
            <name name-style="western">
              <surname>Hauschild</surname>
              <given-names>Axel</given-names>
            </name>
            <name name-style="western">
              <surname>Enk</surname>
              <given-names>Alexander H</given-names>
            </name>
            <name name-style="western">
              <surname>Haferkamp</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Klode</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schadendorf</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>Philipp</given-names>
            </name>
            <name name-style="western">
              <surname>Holland-Letz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>Bastian</given-names>
            </name>
            <name name-style="western">
              <surname>von Kalle</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fröhling</surname>
              <given-names>Stefan</given-names>
            </name>
            <name name-style="western">
              <surname>Gaiser</surname>
              <given-names>Maria R</given-names>
            </name>
            <name name-style="western">
              <surname>Hartmann</surname>
              <given-names>Daniela</given-names>
            </name>
            <name name-style="western">
              <surname>Gesierich</surname>
              <given-names>Anja</given-names>
            </name>
            <name name-style="western">
              <surname>Kähler</surname>
              <given-names>Katharina C</given-names>
            </name>
            <name name-style="western">
              <surname>Wehkamp</surname>
              <given-names>Ulrike</given-names>
            </name>
            <name name-style="western">
              <surname>Karoglan</surname>
              <given-names>Ante</given-names>
            </name>
            <name name-style="western">
              <surname>Bär</surname>
              <given-names>Claudia</given-names>
            </name>
            <name name-style="western">
              <surname>Brinker</surname>
              <given-names>Titus J</given-names>
            </name>
            <collab>Collabrators</collab>
          </person-group>
          <article-title>Systematic outperformance of 112 dermatologists in multiclass skin cancer image classification by convolutional neural networks</article-title>
          <source>Eur J Cancer</source>
          <year>2019</year>
          <month>09</month>
          <volume>119</volume>
          <fpage>57</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0959-8049(19)30381-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejca.2019.06.013</pub-id>
          <pub-id pub-id-type="medline">31419752</pub-id>
          <pub-id pub-id-type="pii">S0959-8049(19)30381-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Codella</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gutman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Emre</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Helba</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Marchetti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dusza</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kalloo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liopyris</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kittler</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Skin lesion analysis toward melanoma detection: A challenge at the 2017 International symposium on biomedical imaging (ISBI), hosted by the international skin imaging collaboration (ISIC)</article-title>
          <year>2018</year>
          <month>04</month>
          <day>04</day>
          <conf-name>IEEE 15th International Symposium on Biomedical Imaging (ISBI )</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>Washington, DC, USA</conf-loc>
          <fpage>168</fpage>
          <lpage>172</lpage>
          <pub-id pub-id-type="doi">10.1109/ISBI.2018.8363547</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tschandl</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rosendahl</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kittler</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The HAM10000 dataset, a large collection of multi-source dermatoscopic images of common pigmented skin lesions</article-title>
          <source>Sci Data</source>
          <year>2018</year>
          <month>08</month>
          <day>14</day>
          <volume>5</volume>
          <fpage>180161</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sdata.2018.161"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2018.161</pub-id>
          <pub-id pub-id-type="medline">30106392</pub-id>
          <pub-id pub-id-type="pii">sdata2018161</pub-id>
          <pub-id pub-id-type="pmcid">PMC6091241</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mendonca</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Marques</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Marcal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rozeira</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>PH² - a dermoscopic image database for research and benchmarking</article-title>
          <source>Annu Int Conf IEEE Eng Med Biol Soc</source>
          <year>2013</year>
          <volume>2013</volume>
          <fpage>5437</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1109/EMBC.2013.6610779</pub-id>
          <pub-id pub-id-type="medline">24110966</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lapuschkin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wäldchen</surname>
              <given-names>Stephan</given-names>
            </name>
            <name name-style="western">
              <surname>Binder</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Montavon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Samek</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>Klaus-Robert</given-names>
            </name>
          </person-group>
          <article-title>Unmasking Clever Hans predictors and assessing what machines really learn</article-title>
          <source>Nat Commun</source>
          <year>2019</year>
          <month>03</month>
          <day>11</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>1096</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-019-08987-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-019-08987-4</pub-id>
          <pub-id pub-id-type="medline">30858366</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-019-08987-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6411769</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zech</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Badgeley</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Costa</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Titano</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Oermann</surname>
              <given-names>EK</given-names>
            </name>
          </person-group>
          <article-title>Variable generalization performance of a deep learning model to detect pneumonia in chest radiographs: A cross-sectional study</article-title>
          <source>PLoS Med</source>
          <year>2018</year>
          <month>11</month>
          <volume>15</volume>
          <issue>11</issue>
          <fpage>e1002683</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pmed.1002683"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1002683</pub-id>
          <pub-id pub-id-type="medline">30399157</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-18-01277</pub-id>
          <pub-id pub-id-type="pmcid">PMC6219764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Winkler</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Fink</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Toberer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Enk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Deinlein</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hofmann-Wellenhof</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lallas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stolz</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Haenssle</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Association Between Surgical Skin Markings in Dermoscopic Images and Diagnostic Performance of a Deep Learning Convolutional Neural Network for Melanoma Recognition</article-title>
          <source>JAMA Dermatol</source>
          <year>2019</year>
          <month>08</month>
          <day>14</day>
          <fpage>1135</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31411641"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamadermatol.2019.1735</pub-id>
          <pub-id pub-id-type="medline">31411641</pub-id>
          <pub-id pub-id-type="pii">2740808</pub-id>
          <pub-id pub-id-type="pmcid">PMC6694463</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Okur</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Turkan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A survey on automated melanoma detection</article-title>
          <source>Engineering Applications of Artificial Intelligence</source>
          <year>2018</year>
          <month>08</month>
          <volume>73</volume>
          <fpage>50</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1016/j.engappai.2018.04.028</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Codella</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rotemberg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Tschandl</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Emre</surname>
              <given-names>Celebi M</given-names>
            </name>
            <name name-style="western">
              <surname>Dusza</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gutman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Helba</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kalloo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liopyris</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Marchetti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kittler</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Skin lesion analysis toward melanoma detection 2018: A challenge hosted by the International Skin Imaging Collaboration (ISIC)</article-title>
          <source>arXiv csCV</source>
          <access-date>2021-03-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1902.03368">http://arxiv.org/abs/1902.03368</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ronneberger</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Brox</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>U-Net: Convolutional Networks for Biomedical Image Segmentation</article-title>
          <year>2015</year>
          <month>10</month>
          <day>05</day>
          <conf-name>Medical Image Computing and Computer-Assisted Intervention – MICCAI 2015</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Munich, Germany</conf-loc>
          <fpage>234</fpage>
          <lpage>241</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-24574-4_28</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
