<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v28i1e71458</article-id>
      <article-id pub-id-type="pmid">41740143</article-id>
      <article-id pub-id-type="doi">10.2196/71458</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Temporal Annotation of German Clinical Language in Real and Synthetic Clinical Documents: Corpus Development and Baseline Tagger Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sarvestan</surname>
            <given-names>Javad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Chenyu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Recski</surname>
            <given-names>Gabor</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Arzideh</surname>
            <given-names>Kamyar</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Modersohn</surname>
            <given-names>Luise</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Chair of Medical Informatics</institution>
            <institution>Institute for AI and Informatics in Medicine</institution>
            <institution>Technical University of Munich (TUM) university hospital</institution>
            <addr-line>Ismaninger Str. 22</addr-line>
            <addr-line>Munich, Bavaria, 81675</addr-line>
            <country>Germany</country>
            <phone>49 8941404320</phone>
            <email>luise.modersohn@tum.de</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8258-4366</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Hahn</surname>
            <given-names>Udo</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5052-0245</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Chair of Medical Informatics</institution>
        <institution>Institute for AI and Informatics in Medicine</institution>
        <institution>Technical University of Munich (TUM) university hospital</institution>
        <addr-line>Munich, Bavaria</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>JULIELab</institution>
        <institution>Friedrich Schiller University Jena</institution>
        <addr-line>Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Institute for Medical Informatics, Statistics and Epidemiology (IMISE)</institution>
        <institution>Leipzig University</institution>
        <addr-line>Leipzig</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Luise Modersohn <email>luise.modersohn@tum.de</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>25</day>
        <month>2</month>
        <year>2026</year>
      </pub-date>
      <volume>28</volume>
      <elocation-id>e71458</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>1</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>15</day>
          <month>2</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>12</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>31</day>
          <month>12</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Luise Modersohn, Udo Hahn. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 25.02.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2026/1/e71458" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Temporal information about patients constitutes a precious source for clinical decision-making and medical treatment. The automatic extraction of such data from unstructured clinical narratives requires time-annotated clinical reports and notes from which time-informed taggers can be learned. Unfortunately, the non-English clinical language community, the German one as a typical example, with only a few exceptions, generally lacks such time-annotated resources to train and evaluate temporal taggers.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>To overcome this metadata bottleneck, we developed a TimeML-conformant annotation schema for both temporal entities and temporal relations adapted to the needs of German medical language. Based on the annotations derived therefrom, we trained state-of-the-art baseline taggers to recognize temporal expressions in clinical documents.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Starting from temporal annotation guidelines for English clinical documents, we developed preliminary annotation guidelines for temporal named entities and temporal relations for the German language. These guidelines were subsequently refined and adapted to German clinical jargon, incorporating the work experience of 5 clinically trained annotators (students of medicine). For this task, we used randomly selected smaller subsets of 2 German clinical corpora—a real-world one (3000PA<sub>J</sub>) and a synthetic one (GraSCCo). Both corpora were annotated (3000PA<sub>J</sub> partially, GraSCCo completely), randomly selecting 10% of the documents as an agreement part on 3000PA<sub>J</sub>. To measure interannotator agreement (IAA), we computed pairwise <italic>F</italic><sub>1</sub>-scores. We used that metadata to develop BERT (Bidirectional Encoder Representations from Transformers)-based language models for the creation of time-sensitive baseline taggers. All annotations are based on TimeML, the international de facto standard for time information markup.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We created 3000PA<sub>J</sub>-temp, a time-annotated corpus of real clinical documents (which cannot be distributed because of the rigid privacy legislation enforced for German clinical data), and GraSCCo-temp, a synthetic one (which is publicly available without any restrictions). Based on the final guidelines, we achieved an IAA <italic>F</italic><sub>1</sub>-score of 0.9 on both corpora for the temporal named entity recognition task. For the temporal relation extraction task, the IAA on GraSCCo plummeted to an <italic>F</italic><sub>1</sub>-score of 0.57 and 0.41 on 3000PA<sub>J</sub>, respectively. Still, those results are comparable with English clinical datasets. Our baseline tagger for named entities reached <italic>F</italic><sub>1</sub>-scores between 0.64 and 0.85. For automatic relation extraction, we achieved <italic>F</italic><sub>1</sub>-scores ranging between 0.60 and 0.64.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We here introduce the first TimeML-compliant annotation scheme for time expressions occurring in German clinical language and apply it to 2 clinical corpora, one with nondistributable real clinical data, the other with distributable synthetic ones. The latter constitutes the first publicly accessible, temporally annotated clinical corpus for the German language. The time tagger trained on these datasets is the first of its kind, fully compliant with the TimeML markup language. The amounts of temporal metadata in our corpora are among the largest datasets ever produced for the clinical domain, both compared with English and German predecessors.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>natural language processing</kwd>
        <kwd>clinical NLP</kwd>
        <kwd>German clinical language</kwd>
        <kwd>corpus development</kwd>
        <kwd>temporal named entity</kwd>
        <kwd>temporal relations</kwd>
        <kwd>annotation guidelines</kwd>
        <kwd>annotation process</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Overview</title>
        <p>Information extraction is a field of natural language processing (NLP) that is concerned with automatically identifying mentions of entities of interest (so-called named entities) and semantic relations holding among them [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. In the medical domain, commonly researched named entity types are, for example, Symptom, Finding, Diagnosis, Disease, or Drug, that are conceptually linked via medically relevant semantic relation types, such as Drug – hasDosage – Dosage, Drug – hasEffectOn – Disease (examples are shown in <xref rid="figure1" ref-type="fig">Figures 1</xref>A and 1B). Whereas named entity types address the terminological level of medical knowledge, including its taxonomic structure, semantic relations help represent single pieces of factual knowledge (medical assertions or facts).</p>
        <p>Sets of medical entities and facts identified by information extraction tools form a bag of information units lacking further structure. One particularly important dimension to add structure to otherwise unrelated information pieces focuses on their temporal ordering on the time axis, a class of information we here refer to as temporal knowledge [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Information about the temporal order of (clinical) events is crucial in a hospital setting, because, for example, a drug reported on admission has a medically different status compared with one prescribed at discharge. Ultimately, temporal knowledge can be used to visualize timelines of patients' histories, which might prove helpful for doctors in medical decision making and for nurses in their daily care routines. This type of knowledge can either be encoded in terms of the named entity types “Event” and “Temporal Expressions,” such as Date, Duration, and Time, and “temporal relations,” which impose a (temporal) ordering on named entities or semantic relations. For instance, we may state a temporal relation between named entities, such as AFTER (examples are shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>C), or between semantic relations, such as BEFORE (examples are shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>D).</p>
        <p>Prior to the automatic extraction of named entities, semantic and temporal relations, specialized classifiers (taggers) have to be pretrained or fine-tuned, typically using manually supplied annotations to guide the machine learning process. We here face a serious disparity between corpora for English and non-English languages (such as German, the focus of our work [<xref ref-type="bibr" rid="ref8">8</xref>]). Based on an extensive survey of temporal datasets and tagging tools in the Related Work section, we encounter a large number of temporally annotated resources for the English language, both for clinical and nonclinical domains, that have no comparable counterpart for the German (clinical and nonclinical) language. For German, such resources are scarce and, if available, rather small in the nonclinical domain, while in the clinical domain, they are almost nonexistent. Moreover, annotations obeying the full TimeML annotation language standard are entirely missing for German.</p>
        <p>Accordingly, in the Methods section, the unique contributions of this article are described in depth: (1) the provision of 2 clinical German-language corpora, a nondistributable real clinical corpus (3000PA<sub>J</sub>) and a distributable synthetic corpus (GraSCCo), both of which have been richly annotated, adhering to TimeML, the current meta-language standard for temporal annotations. 3000PA<sub>J</sub> and GraSCCo are the first corpora annotated with TimeML markup for the German language ever. (2) Exploiting these annotations, we trained the first transformer-based baseline taggers that automatically extract temporal information encoded in German clinical reports and notes. Up until now, transformer-based temporal taggers are not even available for the general German language (eg, covering news or social media content).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Examples for named entities, semantic, and temporal relations.</p>
          </caption>
          <graphic xlink:href="jmir_v28i1e71458_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>Temporal information about patients constitutes a precious source for clinical decision making and medical treatment. It forms cohesive ties between single factual statements by linking them via temporal relations (see the examples for AFTER and BEFORE in <xref rid="figure1" ref-type="fig">Figure 1</xref>), which are the basis for temporal reasoning (eg, AFTER (x,y) and AFTER (y,z) transitively imply AFTER (x,z)). The automatic extraction of such temporal data is a prerequisite for the overarching goal to automatically construct consistent, maximally complete, and chronologically coherent timelines of the patients' medical history from unstructured clinical documents and structured electronic medical records to help support medical diagnosis, treatment decisions, and prognosis [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref20">20</xref>].</p>
        <p>The automatic extraction of such temporal information from unstructured medical records (clinical reports, notes, or free text fields in the electronic medical record) requires language models trained on raw or metadata-enriched, that is, annotated, textual data. However, annotated temporal data resources are still quite rare and often seriously limited in size. Shortage of corpora with temporal metadata, however, directly hinders supervised learning of time-sensitive language models.</p>
        <p>The starting point of time-centered knowledge representation research dates back to Allen’s time algebra [<xref ref-type="bibr" rid="ref21">21</xref>], which was then adopted in the design of TimeML [<xref ref-type="bibr" rid="ref22">22</xref>], a specification and annotation language for temporal natural language utterances that combines temporal entities (Dates, Durations, Events, etc) and relations (eg, BEFORE, AFTER, OVERLAP); temporal relations impose temporal orderings on temporal entities. After years of experimentation, TimeML evolved into an ISO (International Organization for Standardization) standard as ISO-TimeML [<xref ref-type="bibr" rid="ref23">23</xref>]. Part of TimeML, and 2 of its historical predecessors, are TIDES TIMEX2 [<xref ref-type="bibr" rid="ref24">24</xref>] and TIMEX3 [<xref ref-type="bibr" rid="ref23">23</xref>], which are used to mark up explicit temporal expressions, such as time expressions, dates, durations, etc. <xref ref-type="table" rid="table1">Table 1</xref> illustrates the dominant role of TimeML as the representational foundation (markup or annotation language) for time-annotated corpora.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Time-focused (mostly English only) nonclinical corpus resources.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="170"/>
            <col width="150"/>
            <col width="130"/>
            <col width="120"/>
            <col width="280"/>
            <thead>
              <tr valign="top">
                <td>Corpus/(challenge) task (year)</td>
                <td>Functional characterization of (challenge) task</td>
                <td>Annotation language</td>
                <td>Text genre</td>
                <td>Size in tokens</td>
                <td>Type/number of metadata</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>TimeBank 1.1 [<xref ref-type="bibr" rid="ref25">25</xref>] (2003)</td>
                <td>N/A<sup>a</sup> (corpus)</td>
                <td>TimeML 1.1</td>
                <td>186 news articles</td>
                <td>68.5k</td>
                <td>13 temporal relation types: 5.1k temporal relation annotations; 11.2k annotation items, in total</td>
              </tr>
              <tr valign="top">
                <td>TimeBank 1.2 [<xref ref-type="bibr" rid="ref26">26</xref>] (2007); for error correction see the work of Ocal et al [<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                <td>N/A (corpus)</td>
                <td>TimeML 1.2</td>
                <td>186/183 news articles</td>
                <td>68.5k</td>
                <td>1.4k TIMEX3 annotations; 7.9k Event annotations; 13 temporal relation types (6.4k temporal relation annotations and 27.6k annotation items, in total)</td>
              </tr>
              <tr valign="top">
                <td>TimeBank-Dense [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>] (2014)</td>
                <td>N/A (corpus)</td>
                <td>Subset of TimeML 1.2</td>
                <td>36 news articles (subset of TimeBank 1.2)</td>
                <td>13.3k (estimated)</td>
                <td>0.3k TIMEX3 annotations; 1.7k Event annotations; 6 temporal relation types (12.7k [10.8k] temporal relation annotations; 14.7k annotation items, in total)</td>
              </tr>
              <tr valign="top">
                <td>TempEval-1 [<xref ref-type="bibr" rid="ref30">30</xref>] (2009)</td>
                <td>Temporal relation (TLink) identification</td>
                <td>Subset of TimeML 1.2 (TIMEX3, Event, TLink)</td>
                <td>182 news articles (subset of TimeBank 1.2)</td>
                <td>61.4k [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                <td>6 temporal relation types: 5.8k temporal relation annotations; 13.9k annotation items, in total [<xref ref-type="bibr" rid="ref28">28</xref>]</td>
              </tr>
              <tr valign="top">
                <td>TempEval-2 [<xref ref-type="bibr" rid="ref32">32</xref>] (2010)</td>
                <td>TIMEX3 identification; Event identification; temporal relation (TLink) identification</td>
                <td>Subset of TimeML 1.2 (TIMEX3, Event, TLink)</td>
                <td>Same as TempEval-1</td>
                <td>63k</td>
                <td>6 temporal relation types: 4.9k temporal relation annotations; 12.7k annotation items, in total (English data only) [<xref ref-type="bibr" rid="ref28">28</xref>]</td>
              </tr>
              <tr valign="top">
                <td>TempEval-3 [<xref ref-type="bibr" rid="ref31">31</xref>] (2013)</td>
                <td>TIMEX3 extraction and normalization; Event extraction and classification; end-to-end temporal relation (TLink) identification</td>
                <td>Subset of TimeML 1.2 (TIMEX3, Event, TLink)</td>
                <td>182 news reports (TimeBank) + 73 news reports(tiny subset of≈1M)(AQUAINT [<xref ref-type="bibr" rid="ref33">33</xref>]);255 news articles, in total</td>
                <td>Gold: 61.4 k (TimeBank) + 6.4 k +34.0 k (tiny subset of AQUAINT [<xref ref-type="bibr" rid="ref33">33</xref>]) = 101.8k, in total; Silver: 666k (Gigaword [<xref ref-type="bibr" rid="ref32">32</xref>])</td>
                <td>13 temporal relation types (full TimeML set): 11.1k temporal relation annotations; 24.2k annotation items, in total (English data only) [<xref ref-type="bibr" rid="ref28">28</xref>]</td>
              </tr>
              <tr valign="top">
                <td>SemEval 2015 - TimeLine Task 4 [<xref ref-type="bibr" rid="ref34">34</xref>] (2015)</td>
                <td>Cross-document analysis of news articles to construct timelines for target events, that is, detecting, anchoring in time, and ordering events for a target entity</td>
                <td>Subset (and minor adaptation) of TimeML 1.2</td>
                <td>120 WikiNews articles, with 4 main topics: Apple, Airbus &#38; Boeing, General Motors, Chrysler &#38; Ford, stock market</td>
                <td>10k per main topic, 40k, in total</td>
                <td>0.9k Event annotations;0.7k Event chain annotations; 38 target entities; 37 timelines</td>
              </tr>
              <tr valign="top">
                <td>RED [<xref ref-type="bibr" rid="ref35">35</xref>] (2016)</td>
                <td>N/A (corpus)</td>
                <td>Subset of TimeML</td>
                <td>95 news articles and casual discussion forum chats</td>
                <td>54.3k tokens</td>
                <td>1.1k TIMEX3 annotations; 8.7k Event annotations; 5 TLink types (Before, Overlap, Begins_on, Ends_on, Simultaneous): 1.4k temporal relation annotations (TLinks)</td>
              </tr>
              <tr valign="top">
                <td>CaTeRS [<xref ref-type="bibr" rid="ref36">36</xref>] (2016)</td>
                <td>N/A (corpus)</td>
                <td>Event definition based on the TRIPS ontology; subset of TimeML TLINKs</td>
                <td>320 five-sentence short stories</td>
                <td>1600 sentences</td>
                <td>2.7k Event annotations;4 TLink types (Before, Overlaps, Contains, Identity): approximately 2.2k temporal relation annotations (TLinks) out of 2.7k causal and temporal relations</td>
              </tr>
              <tr valign="top">
                <td>Event StoryLine (ESC) v0.9 [<xref ref-type="bibr" rid="ref37">37</xref>] (2017)</td>
                <td>N/A (corpus)</td>
                <td>Compatible with TimeML</td>
                <td>258 news articles about calamityevents, that is, natural disasters, shootings, killings, accidents, trials, etc.</td>
                <td>N/A</td>
                <td>1.3k TIMEX3 annotations; 7.3k Event annotations; 4 TLink types (Before, After, Contains, Overlap): 6.9k temporal relation annotations (TLinks)</td>
              </tr>
              <tr valign="top">
                <td>Universal Decompositional Semantics Time (UDS-T) [<xref ref-type="bibr" rid="ref29">29</xref>] (2019)</td>
                <td>Categorical temporal relations are represented as real-valued relative timelines (on top of Universal Dependency parse trees)</td>
                <td>Mapping of events to their likely durations and event pairs as real-valued relative timelines</td>
                <td>Mixed Web documents (blog posts, newsgroup threads, emails, product reviews, and answers from QA websites) [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>254.8k tokens [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>32.3k Event annotations; 70.4k temporal relation annotations</td>
              </tr>
              <tr valign="top">
                <td>TDG [<xref ref-type="bibr" rid="ref39">39</xref>] (2020)</td>
                <td>N/A (corpus)</td>
                <td>Subset of TimeML + Temporal Dependency Graphs</td>
                <td>500 WikiNews articles</td>
                <td>Not reported</td>
                <td>2.5k TIMEX3 annotations; 15.0k Event annotations; 4 TLink types (Before, After, Overlap, Includes): 28.4k temporal relation annotations (TLinks)</td>
              </tr>
              <tr valign="top">
                <td>Maven-Ere [<xref ref-type="bibr" rid="ref40">40</xref>] (2022)</td>
                <td>N/A (corpus)</td>
                <td>Subset of TimeML: TIMEX3, TLink</td>
                <td>4480 Wikipedia articles</td>
                <td>Not reported</td>
                <td>25.8k TIMEX3 annotations; 6 TLink types (Before, Contains, Overlap, Begins_on, Ends_on, Simultaneous): 1216k temporal relation annotations (TLinks)</td>
              </tr>
              <tr valign="top">
                <td>TimeBankNT [<xref ref-type="bibr" rid="ref41">41</xref>] (2024)</td>
                <td>Full timeline annotation (all possible TLinks) of the sparse TLink TimeBankDense [<xref ref-type="bibr" rid="ref28">28</xref>] annotations</td>
                <td>Subset of TimeML: TIMEX3, Event, TLink</td>
                <td>36 news articles(subset of TimeBank 1.2)</td>
                <td>13.3k (estimated)</td>
                <td>0.3k TIMEX3 annotations; 1.7k Event annotations; 102.3k (104.8k) temporal relation annotations (TLinks)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The early TimeBank corpus [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>] witnessed the consolidation of TimeML over a decade. As an experimental vehicle, it is characterized by small document and token numbers as well as low amounts of annotated temporal data.</p>
        <p>A simplified version of expressionally rich TimeML became the metadata backbone for TempEval [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>], a series of time-focused shared task challenges run by NLP researchers within the framework of SemEval, a workshop series focusing on a broad range of semantic interpretation topics organized under the auspices of the Association for Computational Linguistics.</p>
        <p>Shared tasks, such as TempEval or SemEval, have become a major driver of progress for NLP [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. They are based on a common gold standard dataset on which several competing research group teams run their own systems against predefined tasks; their submitted solutions are, finally, compared against the gold standard, which yields a ranking of the teams involved based on their performance for specific tasks. Top-ranked teams are then given the opportunity at a closing workshop and invited to journal publications to feature the most successful methodologies—thus, continuously advancing the methodological repertoire of NLP on the basis of empirical evidence from benchmarking experiments.</p>
        <p>The TempEval-3 corpus [<xref ref-type="bibr" rid="ref31">31</xref>] was the largest in this series and contains 255 news articles, with roughly 95k tokens, selected from the TimeBank 1.2 corpus [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>] (183/186 articles) and the Aquaint corpus (73 news reports) [<xref ref-type="bibr" rid="ref33">33</xref>] (numbers slightly differ dependent on the cited literature); TimeBank-Dense [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>], its relationally richer successor, comes with a total of 12,715 temporal relations (more than 2 times the number of the original TimeBank corpus). Interestingly, the second edition of TempEval [<xref ref-type="bibr" rid="ref32">32</xref>] contained data not only for English, but also for Chinese, French, Italian, Korean, and Spanish, whereas the third edition [<xref ref-type="bibr" rid="ref31">31</xref>] dealt with English and Spanish data only. A variant of TempEval was considered in the Timeline Task 4 of SemEval 2015, which featured cross-document analysis of news articles to construct timelines for events [<xref ref-type="bibr" rid="ref34">34</xref>] described in a series of documents. For all 3 challenges in TempEval, 9 subtasks had to be tackled that fell into 3 categories: time expression identification (spans and TIMEX3 classes, such as Date, Time, Duration, etc), event expression identification (spans and Modality, Degree, Polarity, etc), and temporal relation identification (temporal relations, such as BEFORE, OVERLAP, AFTER, and a narrative container relation typed as CONTAINS).</p>
        <p>In an intermediary phase, new corpora were generated featuring different text genres (eg, user-generated contents [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref46">46</xref>], Wikipedia articles [<xref ref-type="bibr" rid="ref40">40</xref>]) and playing with different sets of temporal relations, yet with only insignificant growth of document sets or metadata volumes. One of the rare departures from strict adherence to TimeML can be found in the UDS-T corpus [<xref ref-type="bibr" rid="ref46">46</xref>], where TimeML’s categorical temporal relations are represented as real-valued relative timelines (on top of Universal Dependency parse trees). UDS-T also stands for a trend towards increasing quantities of documents/tokens (&#62;250k tokens) and metadata (&#62;100k annotation items). Truly impressive breakthroughs in both of these dimensions have been achieved only recently by getting large numbers of crowdworkers involved, such as for Maven-Ere [<xref ref-type="bibr" rid="ref40">40</xref>], which excels in, for example, more than a million temporal relation annotations. In addition, TimeBankNT [<xref ref-type="bibr" rid="ref41">41</xref>] increases the number of metadata by an order of magnitude (&#62;100k temporal relation annotations) relative to TimeBank-Dense. Almost all of the corpora in <xref ref-type="table" rid="table1">Table 1</xref> incorporate newswire/newspaper documents only (with some exceptions mentioned above). In contradistinction, <xref ref-type="table" rid="table2">Table 2</xref> features corpora with clinical contents.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Time-focused (English only) clinical corpus resources.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="230"/>
            <col width="180"/>
            <col width="130"/>
            <col width="140"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Corpus/(challenge) task (Year)</td>
                <td>Functional characterization of (challenge) task</td>
                <td>Annotation language</td>
                <td>Text genre</td>
                <td>Size in tokens</td>
                <td>Type/number of metadata</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>CLEF [<xref ref-type="bibr" rid="ref47">47</xref>] (2009)</td>
                <td>N/A<sup>a</sup> (corpus)</td>
                <td>TIMEX3 &#38; self-defined set of 8 temporal relations (Before, After, Overlap, Is_included, Ended_by, Begun_ by)</td>
                <td>50 clinical reports; 50 histopathology reports;50 imaging reports</td>
                <td>Not reported</td>
                <td>Clinical named entity types (Drug-or-Device, Intervention, Condition, Investigation, Locus, etc); 3.8k named entity annotations; clinical relation types (has_Target, has_Finding, has_Location, Modifies, etc); 2.4k clinical relation annotations; 0.5k temporal relation annotations (for 10 documents, only)</td>
              </tr>
              <tr valign="top">
                <td>i2b2 2012 [<xref ref-type="bibr" rid="ref48">48</xref>] (2013)</td>
                <td>Spans and types/attributes of temporal expressions (TIMEX3), referring to Dates, Times, Durations (incl. Normalization to ISO<sup>b</sup>8601 standard); Spans and types/attributes of Events, including. Both clinical concepts, such as Problems, Tests, Treatments, and Events relevant to the patient’s clinical timeline, such as Admissions, Transfers between departments; Temporal relations between the clinical Events and temporal expressions (Before, After, Overlap)</td>
                <td>Simplified version of TimeML adapted to clinical narratives and purposes (eg, the inclusion of clinical concepts, such as Problems, Tests, and Treatments, into Events) [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>310 discharge summaries</td>
                <td>About 178k tokens</td>
                <td>2.4k (train) + 1.8k (test) annotation units for temporal expressions (TIMEX3); 15.6k (train) + 13.6k (test) annotation units for temporal Events; 33.5k (train) + 27.7k (test) annotation units for temporal relations; 94.6k annotation units, in total</td>
              </tr>
              <tr valign="top">
                <td>THYME [<xref ref-type="bibr" rid="ref50">50</xref>] (2014)</td>
                <td>N/A (corpus)</td>
                <td>ISO-TimeML (THYME- TimeML) [<xref ref-type="bibr" rid="ref23">23</xref>]; TIMEX3, Event, 5 temporal relations (Before, Overlap, Begins_on, Ends_on, Contains)</td>
                <td>1254 clinical notes and pathology reports (oncology: brain cancer, colon cancer)</td>
                <td>Not reported</td>
                <td>Subset of the THYME colon cancer corpus (107 documents): 1.4k annotation units for temporal expressions (TIMEX3); 15.8k annotation units for temporal Events; 7.9k annotation units for temporal relations; 25.1k annotation units, in total</td>
              </tr>
              <tr valign="top">
                <td>Clinical TempEval-1, subbranch within TempEval as part of SemEval [<xref ref-type="bibr" rid="ref51">51</xref>] (2015) and Clinical TempEval-2 [<xref ref-type="bibr" rid="ref52">52</xref>] (2016)</td>
                <td>Spans and types/attributes of temporal expressions (TIMEX3), referring to Dates, Times, Durations, etc; Spans and types/attributes of Events, including both clinical concepts, such as Problems, Tests, Treatments; temporal relations between the clinical events and the document creation time (Before, After, Overlap, Before-Overlap) and narrative container relations</td>
                <td>Extension of TimeML for temporal expressions, medical events, and temporal relations between events and times (Styler et al [<xref ref-type="bibr" rid="ref50">50</xref>] shows the details of extensions of TimeML)</td>
                <td>591 clinical notes and pathology reports (colon cancer)</td>
                <td>Not reported</td>
                <td>7.9k annotation units for TIMEX3 time expressions; 78.9k annotation units for Events; 23.2k annotation units for temporal relations; 110.0k annotation units, in total</td>
              </tr>
              <tr valign="top">
                <td>Clinical TempEval-3 [<xref ref-type="bibr" rid="ref53">53</xref>] (2017)</td>
                <td>Same tasks as in Clinical TempEval-1 and Clinical TempEval-2</td>
                <td>Same annotation language as in Clinical TempEval-1 and Clinical TempEval-2</td>
                <td>Same colon cancer dataset as in Clinical TempEval-1 and Clinical TempEval-2 + a second dataset (595 documents) with focus on brain cancer</td>
                <td>Not reported</td>
                <td>(Virtually the same number of annotation items for colon cancer as in Clinical TempEval-1 and Clinical TempEval-2) 6.6k annotation units for TIMEX3 time expressions; 48.9k annotation units for Events; 7.3k annotation units temporal relations; 62.8k annotation units for colon cancer, in total; 172.8k annotation units; in total.</td>
              </tr>
              <tr valign="top">
                <td>n2c2 [<xref ref-type="bibr" rid="ref54">54</xref>], follow-up event of i2b2 2012 (2023)</td>
                <td>Identification of medication change (Event): determine the Action, Negation, Temporality, Certainty, and Actor for any change events (Context)</td>
                <td>Categories for temporality (Past, Present, Future, Unknown) are considerably coarser in granularity than those from the i2b2 2012 Shared Task and are not grounded in TimeML</td>
                <td>500 clinical notes (discharge summaries, correspondence notes)</td>
                <td>About 308k tokens (estimated from the study by Kumar et al [<xref ref-type="bibr" rid="ref55">55</xref>])</td>
                <td>About 1.7k annotation units</td>
              </tr>
              <tr valign="top">
                <td>CALEX[<xref ref-type="bibr" rid="ref56">56</xref>] (2019)</td>
                <td>N/A (corpus)</td>
                <td>TimeML-based TIMEX3 (Date, Time, Duration, Frequency) plus an extension (CALEX) for timeline construction based on calendar expressions</td>
                <td>180 discharge summaries, 53 psychiatry reports, 70 pediatrics reports, 75 emergency room reports, 378 clinical reports, in total</td>
                <td>55,433 (discharge summaries); 67,569 (psychiatry); 36,675 (pediatrics); 52,041 (emergency), 211.7k clinical reports, in total</td>
                <td>2378 TIMEX3 annotations</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>ISO: International Organization for Standardization.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The CLEF corpus [<xref ref-type="bibr" rid="ref47">47</xref>] was the first clinical time-focused dataset ever, with limited size though (150 documents, &#60;7k annotated items from which only a small fraction cover temporal information), restricted to TIMEX expressions, yet with a rich repertoire of named entities, (self-defined) semantic and temporal relations. It became the forerunner of the seminal THYME corpus [<xref ref-type="bibr" rid="ref50">50</xref>], a flagship enterprise that, unlike CLEF, fully adhered to TimeML representation conventions and came with roughly 1.3k clinical reports and slightly more than 25k temporal annotations on a 107-document subset thereof.</p>
        <p>Fortunately, the idea of challenge competitions also attracted clinical NLP researchers. Inspired by TempEval, temporal aspects were targeted within the i2b2 2012 Shared Task on Temporal Relations in Clinical Text [<xref ref-type="bibr" rid="ref48">48</xref>], here with focus on time information contained in clinical reports. Participating systems were required to extract virtually the same types of temporal knowledge as those targeted by TempEval:</p>
        <list list-type="order">
          <list-item>
            <p>Spans and types/attributes of temporal expressions, referring to Dates, Times, Durations, or frequency phrases in the clinical text (subsequently, the values of the extracted TIMEX temporal expressions had to be normalized to the ISO8601 specification standard).</p>
          </list-item>
          <list-item>
            <p>Spans and types/attributes of clinically significant events, including both clinical concepts (ie, named entities) such as Problems, Tests, Treatments, and ClinicalDepartments, and events relevant to the patient’s clinical timeline, such as Admissions, Transfers between departments.</p>
          </list-item>
          <list-item>
            <p>Temporal relations between the clinical events and temporal expressions.</p>
          </list-item>
        </list>
        <p>For these challenge tasks, the i2b2 2012 Shared Task organizers added a temporal annotation layer to the dataset, 310 discharge summaries (about 178k tokens), that had already been used in previous i2b2 rounds. For annotation purposes, a simplified version of TimeML was taken as a starting point, but had to be adapted to better suit clinical narratives and purposes (eg, the inclusion of clinical concepts, such as Problems, Tests, and Treatments, into Events) [<xref ref-type="bibr" rid="ref49">49</xref>]. The i2b2 2012 Shared Task corpus, finally, is accessible on the basis of signing a data use agreement and comes (for training) with 2366 annotation units for clinically relevant temporal expressions (TIMEX3 data), 15,567 annotation units for clinically relevant temporal events, and 33,543 annotation units for clinically relevant temporal relations; train and test data sum up to almost 95k annotation units. This landmark corpus exceeded previous annotation efforts in this field (most notably CLEF [<xref ref-type="bibr" rid="ref47">47</xref>]) both in terms of the number of annotated documents and annotation units by a large margin and became a benchmark for future research.</p>
        <p>Recently, a time-wise much narrower shared task devoted to medication change events documented in clinical notes was run within the context of n2c2, the follow-up event of i2b2 [<xref ref-type="bibr" rid="ref54">54</xref>]. Participants had to identify medication change (Event) and determine the Action, Negation, Temporality, Certainty, and Actor for any change events (Context). The categories for temporality (Past, Present, Future, Unknown; about 1.7k annotation units) are considerably coarser in granularity than those from the previous i2b2 2012 Shared Task and are not grounded in TimeML. An annotation effort that extends TIMEX3 expressions for timeline construction based on calendar expressions is reported by Viani [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <p>Complementary to these activities, within the TempEval branch of SemEval, a clinical TempEval subbranch was established. In the first 2 runs of this medically focused TempEval challenge [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>], roughly 600 deidentified clinical notes and pathology reports from colon cancer patients at Mayo Clinic were manually annotated with an extension of TimeML for temporal expressions, medical events, and temporal relations between events and times (details of the annotation process and extensions of TimeML as part of the THYME corpus are described by Styler et al [<xref ref-type="bibr" rid="ref50">50</xref>]). In the third run of TempEval [<xref ref-type="bibr" rid="ref53">53</xref>], this dataset was complemented by a second one with a focus on brain cancer, as the organizers wanted to explore the potential for domain adaptation, that is, how do systems trained on colon cancer data perform when tested on brain cancer data?</p>
        <p>The TimeML-annotated corpus from TempEval is available on a data use agreement basis as well, and comes (for colon cancer) with roughly 83k annotation units in its training (50%), and development (25%) splits, hence contains around 110k annotation units together with the held-out test set (25% of the entire dataset). For brain cancer, 48k annotation units are available for training (50%) and development (25%), and 15k in the test split, summing up to 63k, in total. Thus, the corpus from TempEval-3 exceeds the i2b2 2012 Shared Task corpus by slightly less than a factor of 2 in terms of annotation units and figures as the second milestone for temporal clinical corpora for the English language.</p>
        <p>All of the above-mentioned corpus building activities almost only cover the English (clinical) language. Since our work deals with German language data, <xref ref-type="table" rid="table3">Table 3</xref> gives an overview of the few efforts to deal with nonclinical German from a temporal perspective.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>German time-focused nonclinical resources (Corpora and Taggers).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="160"/>
            <col width="130"/>
            <col width="160"/>
            <col width="180"/>
            <col width="110"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td>Resource type</td>
                <td>Name of resource (Year)</td>
                <td>Functional characterization</td>
                <td>Annotation language</td>
                <td>Text genre</td>
                <td>Size in tokens</td>
                <td>Type/number of metadata</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Corpus</td>
                <td>EuroParl [<xref ref-type="bibr" rid="ref57">57</xref>] (2008)</td>
                <td>Time annotation mappings in parallel corpora: English → German</td>
                <td>Subset of TimeML: TIMEX3, Events, no temporal relations</td>
                <td>Transcribed speeches in the European Parliament</td>
                <td>960k bisentences (train) and 0.3k bisentences (dev/ test)</td>
                <td>Not reported</td>
              </tr>
              <tr valign="top">
                <td>Corpus</td>
                <td>WikiWarsDE [<xref ref-type="bibr" rid="ref58">58</xref>] (2011)</td>
                <td>N/A<sup>a</sup></td>
                <td>TIMEX2 [<xref ref-type="bibr" rid="ref22">22</xref>], a subset of TimeML restricted to dates, time expressions, and durations)</td>
                <td>22 German Wikipedia articles about famous wars in history corresponding to the English selection in WikiWars [<xref ref-type="bibr" rid="ref59">59</xref>]</td>
                <td>95.6k tokens</td>
                <td>2.2k TIMEX2 annotation units</td>
              </tr>
              <tr valign="top">
                <td>Corpus</td>
                <td>KRAUTS [<xref ref-type="bibr" rid="ref60">60</xref>] (2018)</td>
                <td>N/A</td>
                <td>TIMEX3</td>
                <td>192 newspaper articles</td>
                <td>75.7k tokens</td>
                <td>1.1k TIMEX3 annotation units</td>
              </tr>
              <tr valign="top">
                <td>Time tagger</td>
                <td>HeidelTime [<xref ref-type="bibr" rid="ref61">61</xref>] (2013)</td>
                <td>Rule-based tagger using gazetteers and regular expressions</td>
                <td>TIMEX2, TIMEX3 subset of TimeML plus normalizations into ISO<sup>b</sup> 8601 standard</td>
                <td>22 German Wikipedia articles about famous wars in history corresponding to the English selection in WikiWars [<xref ref-type="bibr" rid="ref59">59</xref>]</td>
                <td>100.7k tokens</td>
                <td>2.2k TIMEX2 annotation units</td>
              </tr>
              <tr valign="top">
                <td>Time tagger</td>
                <td>HeidelTimeext [<xref ref-type="bibr" rid="ref62">62</xref>] (2022)</td>
                <td>Extended rule-based tagger using gazetteers and regular expressions</td>
                <td>TIMEX3</td>
                <td>Mix of 10 parliament protocols, 10 books, 766 newspaper and 10 scholarly articles, 10k Wikipedia sentences</td>
                <td>5.121k tokens</td>
                <td>56.8k/53.8k TIMEX3 annotation units (automatically generated)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>ISO: International Organization for Standardization.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Three German-language corpora have been built with a focus on time information. EuroParl [<xref ref-type="bibr" rid="ref57">57</xref>] collects transcribed speeches (roughly 1m bisentences) from the European Parliament. TimeML-conformant temporal annotations are automatically mapped from English source texts to German targets. WikiWarsDE [<xref ref-type="bibr" rid="ref58">58</xref>] assembles 22 Wikipedia articles on famous wars; its time representations are restricted to TIMEX expressions. So is the annotation in KRAUTS [<xref ref-type="bibr" rid="ref60">60</xref>] based on 192 newspaper articles. For all 3 corpora, token counts do not exceed 100k, and at most, roughly 2k manual gold standard annotations are provided (HeidelTimeext [<xref ref-type="bibr" rid="ref62">62</xref>] offers a substantially larger yet automatically generated silver standard). Overall, these are, in comparison with the numbers in <xref ref-type="table" rid="table1">Table 1</xref>, tiny corpora with low annotation density and limited representational expressiveness (with the exception of Spreyer and Frank’s study [<xref ref-type="bibr" rid="ref57">57</xref>]).</p>
        <p>Two versions of the same time tagger also deserve mention. HeidelTime [<xref ref-type="bibr" rid="ref61">61</xref>] was originally built on English data and then augmented for tagging German data. HeidelTime is a classical rule-based system using regular expressions and additional gazetteers. The step from HeidelTime to HeidelTimeext [<xref ref-type="bibr" rid="ref62">62</xref>] comes with an augmented and updated rule set, an increase of the document size and token number (more than 5m tokens), and the number of temporal annotations (more than 50k items). However, in both cases, the representational expressiveness is limited to TIMEX expressions.</p>
        <p>The state of German-language clinical corpora with temporal metadata is basically a short story summarized in <xref ref-type="table" rid="table4">Table 4</xref>. The MACCS corpus [<xref ref-type="bibr" rid="ref63">63</xref>] is made of slightly more than 1.7k discharge summaries and clinical notes from the nephrology domain whose temporal annotations are based on a corpus-specific, that is, non–TimeML-conformant annotation language. Our work, instead, is fully TimeML-compliant and features 2 different corpora. 3000PA<sub>J</sub> comes with 1100 real clinical documents, 1.7M tokens, and 120k temporal annotations, whereas GraSCCo is a much smaller corpus product featuring 63 synthetic documents, 44k tokens, and almost 12k temporal annotation units. Due to rigid data privacy legislation in Germany, 3000PA<sub>J</sub> cannot be made publicly available, whereas GraSCCo can (it consists of fictitious clinical data). With roughly 131k annotation items, however, both corpora not only exceed all German-language corpora (whether clinical or nonclinical) in terms of temporal metadata but also all clinical English time-focused corpora, with one exception—only the million-scale nonclinical Maven-Ere corpus [<xref ref-type="bibr" rid="ref40">40</xref>] offers a (much) larger number of temporal annotations.</p>
        <p>How do 3000PA<sub>J</sub> and GraSCCo compare with other non-English clinical corpora annotated with temporal metadata? <xref ref-type="table" rid="table5">Table 5</xref> lists such textual resources whose size exceeds 50 documents and 1k annotation units. Perhaps, the closest in kinship is the French MERLOT corpus [<xref ref-type="bibr" rid="ref64">64</xref>] that also adheres to TimeML specifications but falls behind by orders of magnitude both in terms of tokens and the amount of temporal metadata. Three other French corpora [<xref ref-type="bibr" rid="ref65">65</xref>-<xref ref-type="bibr" rid="ref67">67</xref>] are much smaller than MERLOT and also contain fewer temporal annotations; only Bannour et al [<xref ref-type="bibr" rid="ref66">66</xref>] adheres to TimeML, including temporal relations. From 4 Chinese corpora, only the work of Liu et al [<xref ref-type="bibr" rid="ref68">68</xref>] contains TimeML specifications for TIMEX3 expressions and temporal relations, yet on a much smaller scale than 3000PA<sub>J</sub>, both document, token, and metadata-wise. Pan et al [<xref ref-type="bibr" rid="ref69">69</xref>] and Liu et al [<xref ref-type="bibr" rid="ref70">70</xref>] focus on TIMEX3 expressions only (Liu et al [<xref ref-type="bibr" rid="ref70">70</xref>] offering the largest corpus in terms of the number of documents, yet not of the number of annotation items), whereas Hu et al [<xref ref-type="bibr" rid="ref71">71</xref>] use a self-supplied time ontology for annotation. Swedish [<xref ref-type="bibr" rid="ref72">72</xref>], Portuguese [<xref ref-type="bibr" rid="ref73">73</xref>], Spanish [<xref ref-type="bibr" rid="ref17">17</xref>], and Italian [<xref ref-type="bibr" rid="ref74">74</xref>] resources are tiny in terms of the number of documents and annotation items they contain (in the range of less than some hundred documents) and the number of temporal relations (less than 5k, if at all). Finally, Cheng et al [<xref ref-type="bibr" rid="ref75">75</xref>] contain 2.6k THYME-conformant temporal relation annotations from a Japanese corpus based on slightly more than 1k documents. Another Japanese corpus, MedTxt-CR-JA [<xref ref-type="bibr" rid="ref76">76</xref>], comes with 27.4k temporal relation annotations that are inferred from 2.6k explicitly annotated start-point annotations. TIMEX3-only annotations are provided by Hamon et al [<xref ref-type="bibr" rid="ref65">65</xref>], Jeyafreeda et al [<xref ref-type="bibr" rid="ref67">67</xref>], Pan et al [<xref ref-type="bibr" rid="ref69">69</xref>], and Velupillai [<xref ref-type="bibr" rid="ref72">72</xref>]. With the exception of the multilingual E3C corpus [<xref ref-type="bibr" rid="ref77">77</xref>] (composed of French, Spanish, Basque, and Italian clinical case reports which differ significantly in style and format from real clinical reports), none of these corpora is publicly available.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>German time-focused clinical corpus resources with our own contribution highlighted.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="90"/>
            <col width="110"/>
            <col width="170"/>
            <col width="180"/>
            <col width="150"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td>Resource type</td>
                <td>Name of resource (Year)</td>
                <td>Annotation language</td>
                <td>Text genre</td>
                <td>Size in tokens</td>
                <td>Type/number of metadata</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Corpus</td>
                <td>MACSS [<xref ref-type="bibr" rid="ref63">63</xref>] (2016)</td>
                <td>Corpus-specific, that is, non-TimeML-conformant temporal annotations: time points, dates, temporal courses</td>
                <td>118 discharge summaries;1607 clinical notes from the nephrology domain (kidney transplantations)</td>
                <td>89.7k tokens; 68.5k tokens</td>
                <td>Not reported</td>
              </tr>
              <tr valign="top">
                <td>Corpus</td>
                <td>3000PA<sub>J</sub> (our work)<sup>a</sup></td>
                <td>TimeML:TIMEX3, Events, Six temporal relations (Before/After, Contains, Overlap, Begins_on, Ends_on)</td>
                <td>1100 real clinical documents, mostly discharge summaries</td>
                <td>1.7M tokens<sup>a</sup></td>
                <td>13.2k annotation units for TIMEX3 time expressions; 46.9k annotation units for Events; 59.1k annotation units for temporal relations; 119.2k<sup>a</sup> annotation units, in total</td>
              </tr>
              <tr valign="top">
                <td>Corpus</td>
                <td>GraSCCo (our work)<sup>a</sup></td>
                <td>TimeML:TIMEX3, Events, Six temporal relations (Before/After, Contains, Overlap, Begins_on, Ends_on)</td>
                <td>63 synthetic clinical documents</td>
                <td>44k tokens<sup>a</sup></td>
                <td>1.2k annotation units for TIMEX3 time expressions; 4.5k annotation units for Events; 5.8k annotation units for temporal relations; 11.6k<sup>a</sup> annotation units, in total</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Our own contribution.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Non-English and non-German time-focused clinical corpus resources.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="130"/>
            <col width="250"/>
            <col width="190"/>
            <col width="130"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Natural language (ISO<sup>a</sup> 639 codes)</td>
                <td>Name of resource (Year)</td>
                <td>Annotation language</td>
                <td>Text genre</td>
                <td>Size in tokens</td>
                <td>Type/number of metadata</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>FR</td>
                <td>No name [<xref ref-type="bibr" rid="ref65">65</xref>] (2014)</td>
                <td>TIMEX3 expressions (plus normalizations)</td>
                <td>182 clinical records (train) and 120 records (test, 25 with reference annotations), 302 records, in total</td>
                <td>Not reported</td>
                <td>Not reported</td>
              </tr>
              <tr valign="top">
                <td>SV</td>
                <td>Stockholm EPR [<xref ref-type="bibr" rid="ref72">72</xref>] (2014)</td>
                <td>TIMEX3 expressions</td>
                <td>112 clinical notes from an ICU<sup>b</sup> unit</td>
                <td>≈50k (estimate)</td>
                <td>&#60;2k TIMEX annotations</td>
              </tr>
              <tr valign="top">
                <td>ZH</td>
                <td>CMedTEX [<xref ref-type="bibr" rid="ref70">70</xref>] (2016)</td>
                <td>Simplified TimeML TIMEX3 expressions: Date, Time, Duration, and Frequency (plus ISO8601 normalizations)</td>
                <td>1778 clinical notes</td>
                <td>Not reported</td>
                <td>46.6k TIMEX3 annotations</td>
              </tr>
              <tr valign="top">
                <td>PT</td>
                <td>No name [<xref ref-type="bibr" rid="ref73">73</xref>] (2018)</td>
                <td>TimeML TIMEX3: Date, Time, Duration, Set (plus ISO8601 normalizations)</td>
                <td>130 discharge summaries</td>
                <td>Not reported</td>
                <td>Not reported</td>
              </tr>
              <tr valign="top">
                <td>FR</td>
                <td>MERLOT [<xref ref-type="bibr" rid="ref64">64</xref>] (2018)</td>
                <td>Simplified TimeML: Date, Time, Duration, and Frequency; 6 TimeML-compliant temporal relations: Before, Begins_on, Ends_on, During, Overlap, Simultaneous</td>
                <td>500 discharge summaries, procedure reports (eg, radiology reports), physician letters, and prescriptions</td>
                <td>148.5k</td>
                <td>3.9k temporal entity annotations; 4.6k temporal relation annotations</td>
              </tr>
              <tr valign="top">
                <td>ZH</td>
                <td>No name [<xref ref-type="bibr" rid="ref68">68</xref>] (2019)</td>
                <td>Three TimeML-compatible temporal relations: Before, After, Simultaneous</td>
                <td>563 clinical notes</td>
                <td>Not reported</td>
                <td>4.0k temporal expressions (ako TIMEX3 expression); 4.0k time intervals (relations)</td>
              </tr>
              <tr valign="top">
                <td>IT</td>
                <td>No name [<xref ref-type="bibr" rid="ref74">74</xref>] (2019)</td>
                <td>THYME-conformant clinical events (Problems, Tests, Treatments, Occurrences) and temporal relations (Before, Before/Overlap, Overlap, After)</td>
                <td>75 clinical reports</td>
                <td>57,263</td>
                <td>4.4k temporal relation annotations</td>
              </tr>
              <tr valign="top">
                <td>ES</td>
                <td>No name [<xref ref-type="bibr" rid="ref17">17</xref>] (2020)</td>
                <td>TIMEX3 expressions (plus expression normalization) and TimeML-noncompliant temporal relations</td>
                <td>50 clinical notes and 50 clinical reports for TIMEX3 identification &#38; 100 clinical notes and 100 clinical reports for temporal relation identification, 300 documents, in total</td>
                <td>Not reported</td>
                <td>TIMEX3 annotations not reported; 200 temporal relations</td>
              </tr>
              <tr valign="top">
                <td>ZH</td>
                <td>TNorm [<xref ref-type="bibr" rid="ref69">69</xref>] (2020)</td>
                <td>TimeML-compliant TIMEX3 (plus expression normalization) only, no temporal relations</td>
                <td>900 discharge summaries</td>
                <td>Not reported</td>
                <td>12.1k TIMEX3 annotations</td>
              </tr>
              <tr valign="top">
                <td>ZH</td>
                <td>No name [<xref ref-type="bibr" rid="ref71">71</xref>] (2022)</td>
                <td>Self-designed Clinical Time Ontology as a basis for an OWL-based temporal logic, with 11 temporal classes (various types of Instants, Intervals, Instant and Interval Collections, and Modifiers) and 16 temporal relations (extension of Allen’s 13 relations set)</td>
                <td>300 case reports containing 3000 clinical statements (presumably sentences)</td>
                <td>Not reported</td>
                <td>3.5k temporal entity annotations; 3.0k temporal relation annotations; 6.5k annotation units, in total</td>
              </tr>
              <tr valign="top">
                <td>JA</td>
                <td>No name [<xref ref-type="bibr" rid="ref75">75</xref>] (2022)</td>
                <td>THYME-compliant, simplified annotation schema: TIMEX3 + 5 temporal relations: On, Before, After, Start, Finish (complemented by 5 medical relations: Change, Compare, Feature, Region, Value)</td>
                <td>1000 radiography interpretation reports of lung cancer + 156 medical history reports of idiopathic pulmonary fibrosis</td>
                <td>Not reported</td>
                <td>2.6k temporal relation annotations</td>
              </tr>
              <tr valign="top">
                <td>FR, ES, IT, EU</td>
                <td>E3C [<xref ref-type="bibr" rid="ref77">77</xref>] (2023)</td>
                <td>THYME-conformant annotation: TIMEX3 expressions, Events, temporal relations</td>
                <td>81 French and Spanish, 86 Italian, and 90 Basque clinical case reports + 615 clinical case reports with silver standard (automatic) annotations</td>
                <td>French: 25,196; Spanish: 24,681; Italian: 24,319; Basque: 22,505 + &#62;200k (silver standard)</td>
                <td>French: 0.3k TIMEX3, 4.3k Event, 4.0k temporal relation annotations; Spanish: 0.4k TIMEX3, 4.8k Event, 4.7k temporal relation annotations; Italian: 0.3k TIMEX3, 3.4k Event, 1.2k temporal relation annotations; Basque: 0.6k TIMEX3, 7.9k Event, 8.0k temporal relation annotations</td>
              </tr>
              <tr valign="top">
                <td>FR</td>
                <td>No name [<xref ref-type="bibr" rid="ref66">66</xref>] (2023)</td>
                <td>Subset of TimeML Document; Creation Time and 5 temporal relations: Before, Before_Overlap, Overlap, and After + TemporalReference (noncompliant with TimeML)</td>
                <td>220 (train) + 57 (test) clinical reports</td>
                <td>Not reported</td>
                <td>2.9k temporal relation annotations</td>
              </tr>
              <tr valign="top">
                <td>JA</td>
                <td>MedTxt-CR-JA [<xref ref-type="bibr" rid="ref76">76</xref>] (2024)</td>
                <td>Start-point ordering of events from which 3 temporal relations can be inferred: Before, Equal, and After</td>
                <td>62 (from 148) case reports</td>
                <td>Not reported</td>
                <td>27.4k temporal relation annotations (based on 2.6k explicitly annotated start-point annotations)</td>
              </tr>
              <tr valign="top">
                <td>FR</td>
                <td>No name [<xref ref-type="bibr" rid="ref67">67</xref>] (2024)</td>
                <td>Corpus-specific, that is, non-TimeML-conformant temporal annotations: Date, Time, Frequency, Duration, and Age</td>
                <td>150 (train) + 50 (test) clinical notes</td>
                <td>Not reported</td>
                <td>0.4k temporal entity annotations</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>ISO: International Organization for Standardization.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>ICU: intensive care unit.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Goals of This Work</title>
        <p>As stated above, temporal knowledge, its annotation, and automatic extraction in the medical domain have almost only been researched in depth in the Anglo-American language community. The non-English clinical language community is basically a low-/nonresource area that, with only a few exceptions, generally lacks temporal metadata. In this article, we propose a 2-fold solution, specifically responding to the strict privacy legislation constraints in the European part of the world.</p>
        <p>The unique contributions of this article are the following: We provide temporal annotations for German clinical documents, including quality checks via interannotator agreement (IAA) metrics. More specifically, we supply temporal annotations for a nondistributable corpus composed of real clinical documents and a publicly distributable corpus composed of synthetic clinical documents. Furthermore, we train transformer-based baseline taggers to automatically extract temporal information encoded in German clinical reports and notes.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>In this section, we will give a detailed overview of our 2 clinical corpora, the annotation schema for temporal named entities and relations, the annotation process and its evaluation, as well as the presentation of our baseline time tagging model for clinical documents. <xref rid="figure2" ref-type="fig">Figure 2</xref> summarizes our experimental setting and illustrates the key steps in our workflow.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Overview of the experimental setup and workflow. BOHB: Bayesian Optimization and Hyperband; GBERT: German BERT model.</p>
          </caption>
          <graphic xlink:href="jmir_v28i1e71458_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The usage of 3000PA<sub>J</sub> is based on the approval by Jena University Hospital ethics committee (4639-12/15) and its data protection officer. The data was collected during the routine clinical care of adults at the intensive care unit or internal medicine ward. All persons were deceased at the time of data collection, thus no informed consent was needed for local data analysis according to the German law at that time. All data were hosted, annotated, and processed at the premises on secure servers with access restrictions and regular data protection training of the annotators. For GraSCCo, no ethics approval is needed as this dataset contains only fictional data written in the style of real clinical documents.</p>
      </sec>
      <sec>
        <title>Clinical Data Resources</title>
        <p>For temporal annotation, we used the 2 corpora already introduced in <xref ref-type="table" rid="table4">Table 4</xref>, namely 3000PA<sub>J</sub> and GraSCCo. 3000PA<sub>J</sub>, a subset of the 3000PA corpus [<xref ref-type="bibr" rid="ref78">78</xref>], consists of about 1100 real, that is, authentic, clinical documents, mostly discharge summaries, with roughly 145k sentences and 1.7m tokens hosted by the Jena University Hospital under strict access restrictions. In effect, this means that according to German data protection legislation, this dataset cannot be made available for public use outside the walls of the Jena University Hospital. 3000PA<sub>J</sub> has already been annotated at multiple semantic layers, including section headings [<xref ref-type="bibr" rid="ref79">79</xref>], Personally Identifiable Information [<xref ref-type="bibr" rid="ref80">80</xref>], medications [<xref ref-type="bibr" rid="ref78">78</xref>], and major nontemporal clinical named entities, namely diagnoses, findings, and symptoms [<xref ref-type="bibr" rid="ref81">81</xref>].</p>
        <p>As an alternative to siloing much-wanted clinical data in the barred 3000PA<sub>J</sub> dataset, we developed GraSCCo [<xref ref-type="bibr" rid="ref82">82</xref>], a synthetic twin corpus which is open for use to the entire clinical NLP community without any access restrictions. Albeit being a tiny document collection with only 63 German multiply-alienated and noise-infused real documents with about 5.4k sentences and 44k tokens, it is available via the Creative Commons license on Zenodo [<xref ref-type="bibr" rid="ref83">83</xref>]. As a noteworthy remark, the authors have already gathered preliminary evidence that GraSCCo may act as a reasonable substitute for 3000PA in terms of clinical language use and genre patterns [<xref ref-type="bibr" rid="ref82">82</xref>]. This observation is fully consistent with other experimental results for various languages, which show that synthetic corpora can indeed replace real clinical corpora with only marginal quality loss regardless of the application tasks and clinical text genres chosen (see, eg, the evidence found for English [<xref ref-type="bibr" rid="ref84">84</xref>-<xref ref-type="bibr" rid="ref86">86</xref>], French [<xref ref-type="bibr" rid="ref87">87</xref>], and Norwegian [<xref ref-type="bibr" rid="ref88">88</xref>]).</p>
      </sec>
      <sec>
        <title>Temporal Annotation</title>
        <sec>
          <title>Overview</title>
          <p>Manually generating temporal annotations is well-known as a notoriously complex and time-consuming task [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]. Hence, to avoid cognitive overload of the human annotators, we split our annotation campaign into 2 separate phases—an entity annotation and a relation annotation phase. Both followed the same schema (<xref rid="figure3" ref-type="fig">Figure 3</xref> depicts one phase equals a complete cycle) and were performed by at least 3 different annotators. This organizational scheme follows the widely acknowledged annotation conventions established by James Pustejovsky and Amber Stubbs [<xref ref-type="bibr" rid="ref89">89</xref>]. Generally speaking, at least 3 independent annotators are necessary to run a proper statistical analysis. All of our annotators were qualified medical students who had already passed their first medical exam after 2 years of study (Physikum, in German).</p>
          <p>Each annotation cycle was divided into a training-only and a production annotation phase. During the training phase, all annotators received the same partition of the entire dataset for annotation, usually about ten documents. Once this batch was completed, their annotations were checked both automatically via an IAA metric based on the average of the pairwise <italic>F</italic><sub>1</sub>-scores, and manually to identify and resolve individual/systematic errors and misunderstandings. The results of the latter phase were then discussed within the annotation team and led to changes in the annotation guidelines, if needed (typical shortcomings arising from premature annotation guidelines are a lack of clarity or ambiguity of instructions, instruction gaps, etc). After that, a new subset was drawn and, again, annotated by all annotators. These training iterations continued until the <italic>F</italic><sub>1</sub>-score, primarily the pairwise <italic>F</italic><sub>1</sub>-score as well as the averaged <italic>F</italic><sub>1</sub>-score, stabilized and reached a reasonable, that is, community-wide accepted, plateau (in the range of 0.9 on a scale of 0 to 1.0 agreement) [<xref ref-type="bibr" rid="ref90">90</xref>]. After this preparatory phase, the final guidelines were frozen and applied to the entire dataset, again, with a randomly chosen partition as the agreement portion, usually 5% to 10% of all documents. These documents will be called agreement documents, as they are the documents on which the IAA is calculated. The final <italic>F</italic><sub>1</sub>-score was determined on these agreement documents and reported as the final agreement value.</p>
          <p>Once the entity annotation task was completed, we unified all annotations of all agreement documents. Thus, label disagreements and missing annotations were detected. These merged entity annotations with all their identified disagreements were then used for the second phase, the relation annotation, and manually corrected by the human annotators. The annotators were also encouraged to modify/correct entity annotations if they disagreed with the results of the first entity-focused round.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Schema of the iterative workflow for annotation guideline development. The optimization cycle is repeated until a stopping criterion is reached on a document subset, mostly a predefined IAA threshold or the number of iterations. The final guideline is subsequently used to annotate the entire corpus in the production phase. IAA: interannotator agreement.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e71458_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Temporal Entity Definition</title>
          <p>Our definitions of time-related entities are identical to THYME [<xref ref-type="bibr" rid="ref50">50</xref>]. Accordingly, those entities are defined as follows:</p>
          <list list-type="bullet">
            <list-item>
              <p>EVENT: Any token or phrase that is related to things that occurred or happened.</p>
            </list-item>
            <list-item>
              <p>TIMEX3: Any token or short phrase that denotes a time expression of the following subtypes:</p>
              <list>
                <list-item>
                  <p>Date: Expressions or phrases that describe a time with accuracy up to a day (06/2020, next Wednesday),</p>
                </list-item>
                <list-item>
                  <p>Time: A specific time of the day (12 am, midnight),</p>
                </list-item>
                <list-item>
                  <p>Duration: A time frame (until yesterday, for 10 minutes),</p>
                </list-item>
                <list-item>
                  <p>Set: A recurring event (twice a day, 1-0-0),</p>
                </list-item>
                <list-item>
                  <p>Quantifier: The number of times something has happened or occurred, needs to be paired with an EVENT (second cycle of chemotherapy),</p>
                </list-item>
                <list-item>
                  <p>PrePost: Expressions like postoperative or premenarche.</p>
                </list-item>
              </list>
            </list-item>
          </list>
          <p>Additionally, entities annotated as an EVENT needed to be marked with one of the following tags according to their point in time with respect to the reported hospital stay: BEFORE (if something happened prior to admission), BEFORE-OVERLAP (if something occurred before but is still present at the time the patient was admitted to the hospital), OVERLAP (if something happened during the hospital stay) and AFTER (if occurrences will happen in the future after the discharge). An example of said annotated entities can be found in <xref rid="figure4" ref-type="fig">Figure 4</xref>.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Sentences to illustrate the annotation of entities annotated with the BRAT annotation tool. Yellow indicates EVENTS, blue stands for TIMEX3 temporal expressions. The labels are written over the marked words or phrases.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e71458_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Temporal Relation Definition</title>
          <p>Temporal entities themselves do not contain sufficient information for the adequate construction of timelines. Without context or ordering information, most of the time-relevant information is missing. Accordingly, temporal relations between those entities have to be determined. All of the relation types we chose are a subset of Allen's interval algebra [<xref ref-type="bibr" rid="ref21">21</xref>]. We followed the definitions in THYME [<xref ref-type="bibr" rid="ref50">50</xref>] and used the following relation types:</p>
          <list list-type="bullet">
            <list-item>
              <p>BEFORE (X,Y) X happened entirely before Y</p>
            </list-item>
            <list-item>
              <p>(AFTER (Y,X) is treated as the inverse of BEFORE (X,Y))</p>
            </list-item>
            <list-item>
              <p>CONTAINS (X,Y) Y happened entirely during X</p>
            </list-item>
            <list-item>
              <p>OVERLAP (X,Y) X and Y share a common partition of time</p>
            </list-item>
            <list-item>
              <p>BEGINS-ON (X,Y) X started with Y</p>
            </list-item>
            <list-item>
              <p>ENDS-ON (X,Y) X finished with Y</p>
            </list-item>
          </list>
          <p>In contrast to THYME and more in line with the i2b2 2012 guidelines, we have instructed our annotators to link each entity to at least one other entity in such a way that each entity is connected to every other entity via a path. This way, we ended up with a connected temporal graph where the entities are the vertices and the relations are represented as edges. This condition is crucial, however, to create a timeline of the entire hospital stay in later processing stages. In contrast to i2b2 2012, we did not use direct connections with the document time or hospital stay (time). This was already covered in the named entity phase by encoding the respective Event tag. <xref rid="figure5" ref-type="fig">Figure 5</xref> demonstrates the application of our annotation conventions to the sentences with already annotated named entities from <xref rid="figure4" ref-type="fig">Figure 4</xref>.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Extension of the already annotated named entities from Figure 4 with temporal relations using the BRAT annotation tool. The arrows indicate the relation together with its relation type.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e71458_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Evaluation Methods</title>
          <p>To determine the IAA scores in our temporal named entity annotation campaign, we calculated the mean of the pairwise precision, recall, and <italic>F</italic><sub>1</sub>-score for the annotated entities. The implementation we used can be found on GitHub [<xref ref-type="bibr" rid="ref91">91</xref>].</p>
          <p>In contrast to temporal named entities, temporal relations need a different treatment for their evaluation. Every entity has temporal connections to every other entity. However, annotating the entire fully connected temporal graph is not feasible, since the number of temporal relations grows quadratically with the number of event mentions (by anchoring events in time, however, annotation of temporal relations indeed scales linearly with the number of events [<xref ref-type="bibr" rid="ref92">92</xref>]). Thus, each annotator was encouraged to annotate the least possible number of relational edges, resulting in something akin to a minimum spanning tree. To guide the annotators towards this goal, they were instructed not only to connect named entities but to think in terms of units of meaning. These units consist of smaller groups of events, such as the timeline of a surgery, the family history, or the events that happened before admission. These smaller units should then be linked to each other, creating a larger group. This should be repeated until all larger units of meaning are linked into one large, comprehensive timeline. If possible, the anchors for these temporal units should be TIMEX3 entities, preferably Dates. A fictitious example for these linkage conventions can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          <p>These conventions result in a number of different graphs that, in the worst case, might share no edges at all. This would lead to a much worse agreement score than justified. The solution we propose here is to use inference and temporal closure [<xref ref-type="bibr" rid="ref93">93</xref>]. We infer the missing edges for each annotator and are thus able to calculate a pairwise agreement score (namely precision, recall, and <italic>F</italic><sub>1</sub>-score; see below). Based on the overlap of temporal relation definitions, we used a slightly adjusted version of the THYME evaluation script. The changes included adjustments to our annotation format (BRAT) [<xref ref-type="bibr" rid="ref94">94</xref>], extending the evaluation, and the visualization of annotations.</p>
        </sec>
        <sec>
          <title>Training and Evaluation of a Baseline Temporal Tagger</title>
          <p>To demonstrate the usefulness of the outcome of our annotation campaign and to determine the first baseline for the automatic temporal tagging of German clinical documents, we used state-of-the-art transformer-based classification technology, that is, BERT (Bidirectional Encoder Representations from Transformers)-ish language models. For German, the most recent and best-performing language model is the German BERT model (GBERT) [<xref ref-type="bibr" rid="ref95">95</xref>]. For our experiments, we used the base model for each of the downstream tasks we specified. To automatically optimize hyperparameters for each task, we used Bayesian Optimization and Hyperband [<xref ref-type="bibr" rid="ref96">96</xref>] (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Our experiments incorporate the huggingface library [<xref ref-type="bibr" rid="ref97">97</xref>], as well as the Bayesian Optimization and Hyperband implementation of the Microsoft NNI framework [<xref ref-type="bibr" rid="ref98">98</xref>]. This configuration was applied to and evaluated on the nonsharable 3000PA (ie, 3000PA<sub>J</sub>) and the publicly sharable GraSCCo corpus. The ground truth data used for training, testing, and evaluation were taken from the annotated documents without further correction. If the document was part of the agreement partition, and thus had been annotated by all annotators independently, we randomly selected one annotation variant from one annotator.</p>
        </sec>
        <sec>
          <title>Evaluation Metrics</title>
          <p>For the statistical evaluation, we apply the following metrics.</p>
          <p>Precision (P), also known as positive predictive value, is the ratio between the gold-standard matching annotations of all named entities or temporal relations for each label (true positives) and all annotated named entities or temporal relations for each label (true positives + false positives).</p>
          <disp-formula>
            <graphic xlink:href="jmir_v28i1e71458_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>Recall (R), also called sensitivity, is the ratio between the gold-standard matching annotations of all named entities or temporal relations for each label (true positives) and all annotated named entities or temporal relations for each label (true positives and false negatives).</p>
          <disp-formula>
            <graphic xlink:href="jmir_v28i1e71458_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p><italic>F</italic><sub>1</sub>-score is defined as the harmonic mean of precision and recall.</p>
          <disp-formula>
            <graphic xlink:href="jmir_v28i1e71458_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>Accuracy (Acc) is defined as the ratio between the gold-standard matching annotations (true positives and true negatives) and all annotations, regardless of their annotations being true or false (sum of annotated entities).</p>
          <disp-formula>
            <graphic xlink:href="jmir_v28i1e71458_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>All of these measurements were calculated pairwise between all possible annotator pairs. The final agreement score for the labels or the entire corpus reports the averaged pairwise agreement scores.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>We present the results of our experiments, distinguishing between manual temporal named entity and temporal relation annotations, as well as the evaluation of the GBERT baseline tagging model that automatically generates temporal tags for clinical documents.</p>
      </sec>
      <sec>
        <title>Annotation of Temporal Named Entities</title>
        <p>In the first cycle of our 2 annotation campaigns, we annotated temporal named entities on both 3000PA<sub>J</sub> and GraSCCo. The results presented here were calculated on the corrected named entity annotations after the relation annotation campaign with its named entity correction subtask.</p>
        <p>As can be seen in <xref ref-type="table" rid="table6">Table 6</xref>, we achieved pairwise <italic>F</italic><sub>1</sub>-scores above 0.8 for nearly all named entity types. Moreover, our overall agreement even exceeds an average <italic>F</italic><sub>1</sub>-score above 0.9. When looking at the token-level evaluation (which is less strict), we achieved an overall agreement average <italic>F</italic><sub>1</sub>-score for 3000PA<sub>J</sub> of 0.912 and 0.910 for GraSCCo.</p>
        <p>On both datasets, the entity type Duration yielded slightly worse scores. There is only one major outlier in terms of IAA in the 3000PA<sub>J</sub> results, namely Quantifier, both in terms of <italic>F</italic><sub>1</sub>-score and SD. Interestingly, this is not observed in GraSCCo. When looking at the confusion matrix of the named entities of both datasets in <xref rid="figure6" ref-type="fig">Figure 6</xref>, we are able to explain this deviant behavior.</p>
        <p>As can be seen in the confusion matrices for entity types of both corpora in <xref rid="figure6" ref-type="fig">Figure 6</xref>, the main reason for mismatching labels was mostly missing annotations, labeled “None” in the confusion matrix. The Event type, in particular, was often only annotated by one annotator. This behavior can be observed for both corpora. Interestingly, in 3000PA<sub>J</sub>, the type Quantifier was also often missed by one of the annotators. The most often confused label pair was Date and Duration. Some translated examples for confused label pairs are:</p>
        <list list-type="bullet">
          <list-item>
            <p>{since 2017}DURATION vs since {2017}DATE</p>
          </list-item>
          <list-item>
            <p>{the entire night}DURATION vs the entire {night}DATE</p>
          </list-item>
          <list-item>
            <p>{after about 30 minutes}DURATION vs after about {30 minutes}TIME</p>
          </list-item>
          <list-item>
            <p>{day of self-harm}DATE vs day of {self-harm}EVENT</p>
          </list-item>
        </list>
        <p>Some systematic errors also appear in the distinction between Duration and Date. Most of the mismatches were grounded in some form of trigger word, such as “since” or “after”. However, it needs to be stressed that these kinds of errors did not occur too often relative to all cases, as can be seen in the confusion matrices in <xref rid="figure6" ref-type="fig">Figure 6</xref>. Mismatches between labels other than the ones described above are very rare (per milli range).</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Absolute number and relative number in percentage of named entities, mean pairwise F1-score with SD for each entity type of the temporal named entity annotation campaign for 3000PAJ and GraSCCo, respectively, as well as the overall agreement for each dataset, which also includes the nonannotated tokens.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="100"/>
            <col width="130"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="130"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Named entity</td>
                <td colspan="4">3000PA<sub>J</sub></td>
                <td colspan="4">GraSCCo</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Absolute number</td>
                <td>Percentage (%)</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td>SD</td>
                <td>Absolute number</td>
                <td>Percentage (%)</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td>SD</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Date</td>
                <td>9099</td>
                <td>15.13</td>
                <td>0.903</td>
                <td>0.055</td>
                <td>663</td>
                <td>11.51</td>
                <td>0.947</td>
                <td>0.020</td>
              </tr>
              <tr valign="top">
                <td>DocTime</td>
                <td>886</td>
                <td>1.47</td>
                <td>0.988</td>
                <td>0.007</td>
                <td>92</td>
                <td>1.60</td>
                <td>0.944</td>
                <td>0.031</td>
              </tr>
              <tr valign="top">
                <td>Time</td>
                <td>593</td>
                <td>0.99</td>
                <td>0.893</td>
                <td>0.058</td>
                <td>3</td>
                <td>0.75</td>
                <td>0.852</td>
                <td>0.075</td>
              </tr>
              <tr valign="top">
                <td>Duration</td>
                <td>824</td>
                <td>1.38</td>
                <td>0.776</td>
                <td>0.083</td>
                <td>138</td>
                <td>2.40</td>
                <td>0.747</td>
                <td>0.091</td>
              </tr>
              <tr valign="top">
                <td>Set</td>
                <td>1107</td>
                <td>1.84</td>
                <td>0.822</td>
                <td>0.081</td>
                <td>158</td>
                <td>2.74</td>
                <td>0.802</td>
                <td>0.107</td>
              </tr>
              <tr valign="top">
                <td>Quantifier</td>
                <td>563</td>
                <td>0.94</td>
                <td>0.550</td>
                <td>0.209</td>
                <td>118</td>
                <td>2.05</td>
                <td>0.938</td>
                <td>0.023</td>
              </tr>
              <tr valign="top">
                <td>PrePost</td>
                <td>146</td>
                <td>0.24</td>
                <td>0.831</td>
                <td>0.041</td>
                <td>24</td>
                <td>0.42</td>
                <td>0.932</td>
                <td>0.041</td>
              </tr>
              <tr valign="top">
                <td>EVENT</td>
                <td>46,909</td>
                <td>78.02</td>
                <td>0.910</td>
                <td>0.017</td>
                <td>4523</td>
                <td>78.54</td>
                <td>0.906</td>
                <td>0.053</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>60,127</td>
                <td>100.0</td>
                <td>0.834</td>
                <td>0.068</td>
                <td>5759</td>
                <td>100.0</td>
                <td>0.883</td>
                <td>0.055</td>
              </tr>
              <tr valign="top">
                <td>Overall Agreement</td>
                <td>—<sup>a</sup></td>
                <td>—</td>
                <td>0.904</td>
                <td>0.024</td>
                <td>—</td>
                <td>—</td>
                <td>0.906</td>
                <td>0.047</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Confusion matrices for temporal named entity types after correction, with 3000PAJ (left) and GraSCCo (right). The color and intensity indicate the relative number of entity pairs (with 1.0 being all and 0.0 no existing pairs). Agreeing pairs (both annotators chose the same label) can be found on the main diagonal.</p>
          </caption>
          <graphic xlink:href="jmir_v28i1e71458_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Annotation of Temporal Relations</title>
        <p>Because of their complexity and the human efforts required for this task, temporal relations were annotated only on a randomly chosen subset of 350 documents of the original 3000PA<sub>J</sub> dataset, whereas all 63 documents of the GraSCCo dataset were dealt with. Both datasets were annotated by the same 4 annotators. The resulting IAA scores incorporating the aforementioned inference rules are depicted in <xref ref-type="table" rid="table7">Table 7</xref>. Because of the nature of points in time and their relation to each other (they form a fully connected temporal graph), relations between 2 named entity pairs always have a relation type, even though it might be automatically inferred rather than manually annotated.</p>
        <p>As can be seen in the total count of relation types, in GraSCCo all entities seem to be connected with each other, as the number of relation types is slightly larger (40 relations more than necessary) than the total number of entity types. But in 3000PA<sub>J</sub> we seem to miss a total of about 1k relations, which means approximately 3 relations per document. However, given the total number of about 60k annotated relations, this is just 1.76% of the anticipated number of relations.</p>
        <p>The confusion matrices for the 5 temporal relation types of both datasets are depicted in <xref rid="figure7" ref-type="fig">Figure 7</xref>.</p>
        <p>The most prominent observation in both confusion matrices is the dominance of the CONTAINS relation type. Especially, OVERLAP was often confused with CONTAINS in both datasets. This is not so surprising given that CONTAINS is a subset of OVERLAP. However, it seems that the stricter CONTAINS relation is used more often compared with the less restrictive OVERLAP relation. We assume that the reason for this phenomenon might be the fact that we hired medical students rather than linguists or computer scientists (an issue often observed in other annotation campaigns, as well). Thus, our annotators have attributed the relation types a more literal meaning, “something contains something”, even partially, and did not share our set theory-based understanding of CONTAINS and OVERLAP. Unfortunately, in the 3000PA<sub>J</sub> corpus, all of the other relation types are often confused with the CONTAINS relation type. Discussions with the annotators revealed that they used the CONTAINS relation type as a residual category, which resulted in generally coding CONTAINS if they were unsure about other alternatives. However, mismatches between other labels occur very rarely (per mille range).</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Absolute numbers and relative numbers in percentage of temporal relations, mean pairwise F1-score with SD for each annotated type of the temporal relation annotation campaign on 3000PAJ and GraSCCo using temporal closure.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="140"/>
            <col width="120"/>
            <col width="100"/>
            <col width="100"/>
            <col width="0"/>
            <col width="140"/>
            <col width="120"/>
            <col width="70"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td>Relation type</td>
                <td colspan="5">3000PA<sub>J</sub></td>
                <td colspan="4">GraSCCo</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Absolute number</td>
                <td>Percentage (%)</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td>SD</td>
                <td colspan="2">Absolute number</td>
                <td>Percentage (%)</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td>SD</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>BEFORE</td>
                <td>5948</td>
                <td>10.07</td>
                <td>0.2</td>
                <td>0.07</td>
                <td colspan="2">547</td>
                <td>9.43</td>
                <td>0.45</td>
                <td>0.28</td>
              </tr>
              <tr valign="top">
                <td>BEGINS-ON</td>
                <td>1030</td>
                <td>1.74</td>
                <td>0.48</td>
                <td>0.07</td>
                <td colspan="2">146</td>
                <td>2.52</td>
                <td>0.64</td>
                <td>0.19</td>
              </tr>
              <tr valign="top">
                <td>ENDS-ON</td>
                <td>724</td>
                <td>1.23</td>
                <td>0.69</td>
                <td>0.06</td>
                <td colspan="2">74</td>
                <td>1.28</td>
                <td>0.73</td>
                <td>0.14</td>
              </tr>
              <tr valign="top">
                <td>OVERLAP</td>
                <td>5046</td>
                <td>8.54</td>
                <td>0.09</td>
                <td>0.13</td>
                <td colspan="2">679</td>
                <td>11.71</td>
                <td>0.33</td>
                <td>0.36</td>
              </tr>
              <tr valign="top">
                <td>CONTAINS</td>
                <td>46,318</td>
                <td>78.42</td>
                <td>0.63</td>
                <td>0.07</td>
                <td colspan="2">4352</td>
                <td>75.06</td>
                <td>0.68</td>
                <td>0.16</td>
              </tr>
              <tr valign="top">
                <td>Overall agreement</td>
                <td>59,066</td>
                <td>100.0</td>
                <td>0.41</td>
                <td>0.08</td>
                <td colspan="2">5798</td>
                <td>100.0</td>
                <td>0.57</td>
                <td>0.27</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Confusion matrices for temporal relation types, with 3000PAJ (left) and GraSCCo (right). The color and intensity indicate the relative number of relation label pairs (with 1.0 being all and 0.0 no existing pairs). Agreeing pairs can be found on the main diagonal.</p>
          </caption>
          <graphic xlink:href="jmir_v28i1e71458_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Baseline Model for Automatic Temporal Tagging</title>
        <p>For the evaluation of the performance of the automatic temporal taggers trained on our annotated datasets, we fine-tuned and optimized a GBERT on both 3000PA<sub>J</sub> and GraSCCo. A summary of the results of our experiments can be found in <xref ref-type="table" rid="table8">Table 8</xref>.</p>
        <p>All in all, GBERT performs well for both the named entity recognition (NER) and the relation extraction task, respectively, on the 3000PA<sub>J</sub> dataset. Training GBERT on 3000PA<sub>J</sub> and testing on GraSCCo results in an expected, yet acceptable, drop in performance. Interestingly, this drop mostly affects the recall score. The union of both datasets results in a similar performance rate compared with the model trained on 3000PA<sub>J</sub> only, yet with a slight decrease in recall and a slight increase in precision, which results in a similar <italic>F</italic><sub>1</sub>-score for both the named entity recognition and the relation extraction task.</p>
        <table-wrap position="float" id="table8">
          <label>Table 8</label>
          <caption>
            <p>Mean pairwise accuracy (Acc), F1-score, precision, and recall for automatic temporal named entity recognition (NER) and relation extraction (REX) on 3000PAJ and GraSCCo, respectively, and a unified set of both (union).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="170"/>
            <col width="150"/>
            <col width="150"/>
            <col width="80"/>
            <col width="140"/>
            <col width="160"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Model</td>
                <td>Train set</td>
                <td>Test set</td>
                <td>Acc</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td>Precision</td>
                <td>Recall</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>NER</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT<sup>a</sup></td>
                <td>3000PA<sub>J</sub></td>
                <td>3000PA<sub>J</sub></td>
                <td>0.95</td>
                <td>0.78</td>
                <td>0.73</td>
                <td>0.84</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>GraSCCo</td>
                <td>GraSCCo</td>
                <td>0.94</td>
                <td>0.85</td>
                <td>0.84</td>
                <td>0.87</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>3000PA<sub>J</sub></td>
                <td>GraSCCo</td>
                <td>0.90</td>
                <td>0.64</td>
                <td>0.82</td>
                <td>0.56</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>union</td>
                <td>union</td>
                <td>0.95</td>
                <td>0.77</td>
                <td>0.75</td>
                <td>0.80</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>REX</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>3000PA<sub>J</sub></td>
                <td>3000PA<sub>J</sub></td>
                <td>0.78</td>
                <td>0.64</td>
                <td>0.63</td>
                <td>0.63</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>GraSCCo</td>
                <td>GraSCCo</td>
                <td>0.81</td>
                <td>0.60</td>
                <td>0.63</td>
                <td>0.58</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>3000PA<sub>J</sub></td>
                <td>GraSCCo</td>
                <td>0.90</td>
                <td>0.64</td>
                <td>0.82</td>
                <td>0.56</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GBERT</td>
                <td>union</td>
                <td>union</td>
                <td>0.81</td>
                <td>0.63</td>
                <td>0.70</td>
                <td>0.59</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table8fn1">
              <p><sup>a</sup>GBERT: German BERT model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Temporal information is crucial for comprehensive medical reasoning; yet, only a few data resources are available for NLP tools to automatically extract such information from clinical documents. Publicly accessible clinical document collections have primarily emerged from challenge tasks, such as i2b2, n2c2, or Clinical TempEval, but cover the English clinical language only (<xref ref-type="table" rid="table2">Table 2</xref>). For a few non-English clinical language communities—French, Chinese (Mandarin), Spanish, Italian, Portuguese, German, Swedish, and Japanese—clinical corpora have been annotated with temporal metadata, but (except for E3C, a multilingual case report corpus) none of them is publicly available due to prohibitive data privacy regulations (<xref ref-type="table" rid="table4">Tables 4</xref> and <xref ref-type="table" rid="table8">8</xref>). We here introduced 2 corpora for the German clinical language annotated with TimeML-compliant metadata—a nondistributable real-world clinical corpus (3000PA<sub>J</sub>), and a distributable synthetic one (GraSCCo). The first stands out with unprecedented quantitative scales in terms of the number of documents, tokens, and temporal metadata, and its adherence to qualitative standards, that is, TimeML specifications, lacking for many non-English alternatives (<xref ref-type="table" rid="table8">Table 8</xref>). The latter, though small-sized and synthetic, is one of the rare (if not the only one) non-English clinical text resources marked up for temporal information that are accessible without distribution restrictions. With reasonable agreement scores for manual annotation, we trained and tested temporal BERT-based taggers under varying experimental conditions and achieved decent performance values using both, 3000PAJ and GraSCCo.</p>
      </sec>
      <sec>
        <title>Principal Results</title>
        <p>In this article, we introduced 2 corpora equipped with temporal metadata for the German clinical language. The first of these corpora, 3000PA<sub>J</sub>, contains real clinical documents, but cannot be distributed in the public domain due to the restrictive privacy legislation codified in Germany and (more generally) Europe. To bypass this severe accessibility hurdle, we enriched a second corpus, GraSCCo, with temporal metadata, which can be distributed without any restrictions since it contains synthetic data, that is, fictitious and noise-adding content, only. The metadata we created for temporal named entities and relations, all of them fully compliant with TimeML, have a high level of credibility, given IAA scores ranging in the high 80s and low 90s.</p>
        <p>As can also be seen from our evaluation results, we are on par performance-wise with comparable English corpora, such as THYME. For named entities and the CONTAINS relation, we even achieved better results on both corpora, 3000PA<sub>J</sub> and GraSCCo. In addition, all documents used in the agreement evaluation were annotated by 4 individual annotators per document and yielded acceptable IAA scores.</p>
        <p>In the end, we come up with about 66k temporal entities and 65k temporal relations, which sum up to 131k temporal annotation units for both corpora. These numbers not only exceed all clinical and nonclinical German-language corpora in terms of temporal metadata created up until now, but also outdo all clinical English time-focused corpora. Only the million-scale nonclinical Maven-Ere corpus [<xref ref-type="bibr" rid="ref40">40</xref>] offers a (much) larger number of temporal annotations.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>We still have to increase the size of GraSCCo (this is ongoing work in our research group). Also, the baseline tagger needs to be complemented by more sophisticated and larger language models. We plan to experiment with temporal (knowledge graph) embeddings, which encode temporal information directly in time-enhanced embeddings [<xref ref-type="bibr" rid="ref99">99</xref>-<xref ref-type="bibr" rid="ref101">101</xref>] and document-level event extraction models [<xref ref-type="bibr" rid="ref102">102</xref>-<xref ref-type="bibr" rid="ref104">104</xref>], which will better accommodate long-range cross-sentence and cross-paragraph dependencies typical of temporal relations in long documents, such as clinical reports.</p>
        <p>As discussed in the results section, the decision to use only medical students resulted in misconceptions regarding the definitions of the temporal relations. Potentially, mixed teams with medical students and annotators with a background in linguistics or computer science might have resulted in better results (as small preliminary experiments for i2b2 2012 and CLEF suggest [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref105">105</xref>]). However, as shown by Raghavan et al [<xref ref-type="bibr" rid="ref106">106</xref>], the level of clinical expertise has only a small impact on the inter-annotator reliability for temporal relations. Furthermore, medical students are more likely to recognize relations between clinical events [<xref ref-type="bibr" rid="ref105">105</xref>], as well as relations based on medical causal dependence [<xref ref-type="bibr" rid="ref105">105</xref>]. Additionally, we used the involuntary break and access restrictions during the COVID pandemic for extensive training iterations for our annotator team. Thus, if we compare our work with THYME, which was annotated by mixed teams as well, they reported similar difficulties and <italic>F</italic><sub>1</sub>-scores to those discussed above.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>To the best of our knowledge, 3000PA<sub>J</sub> and GraSCCo are the first German clinical corpora to be annotated with temporal named entities and relations fully compliant with the TimeML de facto markup standard. Surprisingly, for nonclinical documents, no comprehensive TimeML-compliant corpus currently exists for German. Furthermore, providing unconstrained access to the synthetic GraSCCo corpus constitutes a major step in metadata availability for the German clinical NLP community. Moreover, the construction principles underlying GraSCCo [<xref ref-type="bibr" rid="ref82">82</xref>] outline a way to extend the generation (not only) of temporal metadata beyond the German language. For the first time ever, a TimeML-compliant baseline temporal tagger for German has been trained and properly validated.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our work can and will be the basis for algorithms and models to automatically detect and combine temporal entities and their relations in order to create clinical timelines [<xref ref-type="bibr" rid="ref107">107</xref>,<xref ref-type="bibr" rid="ref108">108</xref>]. These timelines will be visualized and are thus able to provide a comprehensive summary of the patients’ clinical history, a potentially valuable source of abstraction for all kinds of clinical decision makers and caretakers.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Example for relation annotation schema.</p>
        <media xlink:href="jmir_v28i1e71458_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 464 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Hyperparameter for transformer training.</p>
        <media xlink:href="jmir_v28i1e71458_app2.docx" xlink:title="DOCX File , 9 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GBERT</term>
          <def>
            <p>German BERT model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">IAA</term>
          <def>
            <p>interannotator agreement</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ISO</term>
          <def>
            <p>International Organization for Standardization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We thank Prof Dr André Scherag, Dr Danny Ammon, and all members of the Data Integration Center of the Jena University Hospital for their continuous support in managing access to 3000PA<sub>J</sub>.</p>
      <p>No artificial intelligence assistance has been used in the writing process of this paper; all text, figures, and tables have been created manually by the authors.</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>This work was supported by the German Ministry of Education and Research (BMBF) within the SMITH and DIFUTURE clusters of the Medical Informatics Initiative (MI-I) under the grants 01ZZ1803G and 01ZZ2009A, respectively.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>LM contributed to the conceptualization of the study, data curation, formal analysis, conduct of experiments, methodology design, provision of resources, software development, validation, visualization, and writing of both the original draft and the review and editing of the manuscript. UH was responsible for funding acquisition, provision of resources, project administration, and supervision, and also contributed to writing the original draft and reviewing and editing the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rastegar-Mojarad</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrabi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Clinical information extraction applications: a literature review</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <volume>77</volume>
          <fpage>34</fpage>
          <lpage>49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30256-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.11.011</pub-id>
          <pub-id pub-id-type="medline">29162496</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30256-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5771858</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bose</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sleeman</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Palta</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kapoor</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A survey on recent named entity recognition and relationship extraction techniques on clinical texts</article-title>
          <source>Appl Sci</source>
          <year>2021</year>
          <volume>11</volume>
          <issue>18</issue>
          <fpage>8319</fpage>
          <pub-id pub-id-type="doi">10.3390/app11188319</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nasar</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Jaffry</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Named entity recognition and relation extraction</article-title>
          <source>ACM Comput Surv</source>
          <year>2021</year>
          <volume>54</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>39</lpage>
          <pub-id pub-id-type="doi">10.1145/3445965</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madkour</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Benhaddou</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Temporal data representation, normalization, extraction, and reasoning: a review from clinical domain</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2016</year>
          <volume>128</volume>
          <fpage>52</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27040831"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2016.02.007</pub-id>
          <pub-id pub-id-type="medline">27040831</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(15)30118-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC4837648</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leeuwenberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moens</surname>
              <given-names>MF</given-names>
            </name>
          </person-group>
          <article-title>A survey on temporal reasoning for temporal information extraction from text</article-title>
          <source>J Artif Intell Res</source>
          <year>2019</year>
          <volume>66</volume>
          <fpage>341</fpage>
          <lpage>380</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.1.11727</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alfattni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Peek</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Extraction of temporal relations from clinical free text: a systematic review of current approaches</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>108</volume>
          <fpage>103488</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30116-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103488</pub-id>
          <pub-id pub-id-type="medline">32673788</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30116-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gumiel</surname>
              <given-names>YB</given-names>
            </name>
            <name name-style="western">
              <surname>Silva e Oliveira</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Claveau</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Grabar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Paraiso</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Moro</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Carvalho</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Temporal relation extraction in clinical texts</article-title>
          <source>ACM Comput Surv</source>
          <year>2021</year>
          <volume>54</volume>
          <issue>7</issue>
          <fpage>1</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1145/3462475</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>Clinical document corpora-real ones, translated and synthetic substitutes, and assorted domain proxies: a survey of diversity in corpus design, with focus on German text data</article-title>
          <source>JAMIA Open</source>
          <year>2025</year>
          <volume>8</volume>
          <issue>3</issue>
          <fpage>ooaf024</fpage>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooaf024</pub-id>
          <pub-id pub-id-type="medline">40371384</pub-id>
          <pub-id pub-id-type="pii">ooaf024</pub-id>
          <pub-id pub-id-type="pmcid">PMC12077144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rumshisky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Temporal reasoning over clinical text: the state of the art</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>814</fpage>
          <lpage>819</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23676245"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-001760</pub-id>
          <pub-id pub-id-type="medline">23676245</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-001760</pub-id>
          <pub-id pub-id-type="pmcid">PMC3756277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kamsu-Foguem</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tchuenté-Foguem</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Foguem</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Verifying a medical protocol with temporal graphs: the case of a nosocomial disease</article-title>
          <source>J Crit Care</source>
          <year>2014</year>
          <volume>29</volume>
          <issue>4</issue>
          <fpage>690.e1</fpage>
          <lpage>e9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jcrc.2014.02.006</pub-id>
          <pub-id pub-id-type="medline">24636931</pub-id>
          <pub-id pub-id-type="pii">S0883-9441(14)00060-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>STI</given-names>
            </name>
            <name name-style="western">
              <surname>Juhn</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Patient-level temporal aggregation for text-based asthma status ascertainment</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2014</year>
          <volume>21</volume>
          <issue>5</issue>
          <fpage>876</fpage>
          <lpage>884</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24833775"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002463</pub-id>
          <pub-id pub-id-type="medline">24833775</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-002463</pub-id>
          <pub-id pub-id-type="pmcid">PMC4147607</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caballero Barajas</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Akella</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Dynamically modeling patient's health state from electronic medical records: a time series approach</article-title>
          <year>2015</year>
          <conf-name>KDD - 15 - Proceedings of the 21st ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>2015 Aug 10</conf-date>
          <conf-loc>Sydney, New South Wales, Australia</conf-loc>
          <publisher-name>Association for Computing Machinery (ACM)</publisher-name>
          <fpage>69</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1145/2783258.2783289</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Loghmanpour</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Penstein-Rosé</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Time series analysis of nursing notes for mortality prediction via a state transition topic model</article-title>
          <year>2015</year>
          <conf-name>CIKM - 15 - Proceedings of the 24th ACM International Conference on Information and Knowledge Management</conf-name>
          <conf-date>2015 Oct 19</conf-date>
          <conf-loc>Melbourne, Victoria, Australia</conf-loc>
          <publisher-name>Association for Computing Machinery (ACM)</publisher-name>
          <fpage>1171</fpage>
          <lpage>1180</lpage>
          <pub-id pub-id-type="doi">10.1145/2806416.2806541</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qiao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Pairwise-ranking based collaborative recurrent neural networks for clinical event prediction</article-title>
          <year>2018</year>
          <conf-name>IJCAI-ECAI '18 - Proceedings of the 27th International Joint Conference on Artificial Intelligence &#38; 23rd European Conference on Artificial Intelligence</conf-name>
          <conf-date>2018 July 13</conf-date>
          <conf-loc>Stockholm, Sweden</conf-loc>
          <fpage>3520</fpage>
          <lpage>3526</lpage>
          <pub-id pub-id-type="doi">10.24963/ijcai.2018/489</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khadanga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Joty</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using clinical notes with time series data for ICU management</article-title>
          <year>2019</year>
          <conf-name>EMNLP-IJCNLP  - Proceedings of the  Conference on Empirical Methods in Natural Language Processing &#38; 9th International Joint Conference on Natural Language Processing;  November ; Hong Kong, China. Association for Computational Linguistics (ACL)</conf-name>
          <conf-date>2019 Nov 03</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>6432</fpage>
          <lpage>6437</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/D19-1678/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/d19-1678</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Najafabadipour</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zanin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez-González</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Torrente</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nuñez García</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz Bermudez</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Provencio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Menasalvas</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Reconstructing the patient's natural history from electronic health records</article-title>
          <source>Artif Intell Med</source>
          <year>2020</year>
          <volume>105</volume>
          <fpage>101860</fpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2020.101860</pub-id>
          <pub-id pub-id-type="medline">32505419</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(19)31146-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deznabi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Iyyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fiterau</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Predicting in-hospital mortality by combining clinical notes with time-series data</article-title>
          <year>2021</year>
          <conf-name>Findings of the Association for Computational Linguistics - ACL-IJCNLP 2021</conf-name>
          <conf-date>2021 Aug 01</conf-date>
          <conf-loc>USA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>4026</fpage>
          <lpage>4031</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2021.findings-acl.352/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2021.findings-acl.352</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olex</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>BT</given-names>
            </name>
          </person-group>
          <article-title>Review of temporal reasoning in the clinical domain for timeline extraction: where we are and where we need to be</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <volume>118</volume>
          <fpage>103784</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00113-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103784</pub-id>
          <pub-id pub-id-type="medline">33862232</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00113-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>MEH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N`</given-names>
            </name>
          </person-group>
          <article-title>Deep learning for temporal data representation in electronic health records: a systematic review of challenges and methodologies</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <volume>126</volume>
          <fpage>103980</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00309-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103980</pub-id>
          <pub-id pub-id-type="medline">34974189</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00309-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Time interval uncertainty-aware and text-enhanced based disease prediction</article-title>
          <source>J Biomed Inform</source>
          <year>2023</year>
          <volume>139</volume>
          <fpage>104239</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(22)00244-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104239</pub-id>
          <pub-id pub-id-type="medline">36356933</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00244-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Towards a general theory of action and time</article-title>
          <source>Artif Intell</source>
          <year>1984</year>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>123</fpage>
          <lpage>154</lpage>
          <pub-id pub-id-type="doi">10.1016/0004-3702(84)90008-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Castaño</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ingria</surname>
              <given-names>RJP</given-names>
            </name>
            <name name-style="western">
              <surname>Saurí</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gaizauskas</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Setzer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>TIMEML: robust specification of event and temporal expressions in text</article-title>
          <source>New Directions in Question Answering</source>
          <year>2003</year>
          <publisher-loc>Washington, D.C</publisher-loc>
          <publisher-name>AAAI Press</publisher-name>
          <fpage>28</fpage>
          <lpage>34</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bunt</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Romary</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ISO-TIMEML : an international standard for semantic annotation</article-title>
          <year>2010</year>
          <conf-name>LREC 2010 - Proceedings of the 7th International Conference on Language Resources and Evaluation</conf-name>
          <conf-date>2010 May 17</conf-date>
          <conf-loc>La Valletta, Malta</conf-loc>
          <publisher-name>European Language Resources Association (ELRA)</publisher-name>
          <fpage>394</fpage>
          <lpage>397</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/L10-1027/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferro</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gerber</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mani</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sundheim</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>TIDES 2005 standard for the annotation of temporal expressions</article-title>
          <source>Linguistic Data Consortium</source>
          <year>2005</year>
          <access-date>2025-08-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ldc.upenn.edu/sites/www.ldc.upenn.edu/files/english-timex2-guidelines-v0.1.pdf">https://www.ldc.upenn.edu/sites/www.ldc.upenn.edu/files/english-timex2-guidelines-v0.1.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Hanks</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Saurí</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>See</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gaizauskas</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Setzer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The TIMEBANK corpus</article-title>
          <year>2003</year>
          <conf-name>Proceedings of the Corpus Linguistics 2003 Conference</conf-name>
          <conf-date>2003 March 28</conf-date>
          <conf-loc>Lancaster, UK</conf-loc>
          <fpage>647</fpage>
          <lpage>656</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boguraev</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Ando</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>TimeBank evolution as a community resource for TimeML parsing</article-title>
          <source>Lang Resour Evaluation</source>
          <year>2007</year>
          <volume>41</volume>
          <issue>1</issue>
          <fpage>91</fpage>
          <lpage>115</lpage>
          <pub-id pub-id-type="doi">10.1007/s10579-007-9018-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ocal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Radas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hummer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Megerdoomian</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive evaluation and correction of the Time Bank corpus</article-title>
          <year>2022</year>
          <conf-name>Proceedings of the 13th International Conference on Language Resources and Evaluation</conf-name>
          <conf-date>2022 June 20</conf-date>
          <conf-loc>Marseille, France</conf-loc>
          <publisher-name>European Language Resources Association (ELRA)</publisher-name>
          <fpage>20</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2022.lrec-1.313/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cassidy</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDowell</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>An annotation framework for dense event ordering</article-title>
          <year>2014</year>
          <conf-name>ACL 2014 - Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>2014 June 22</conf-date>
          <conf-loc>Baltimore, Maryland, USA</conf-loc>
          <publisher-name>Short Papers</publisher-name>
          <fpage>501</fpage>
          <lpage>506</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/p14-2082</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Cassidy</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDowell</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Dense event ordering with a multi-pass architecture</article-title>
          <source>Trans Assoc Comput Linguist</source>
          <year>2014</year>
          <volume>2</volume>
          <fpage>273</fpage>
          <lpage>284</lpage>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00182</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gaizauskas</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schilder</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hepple</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moszkowicz</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>The TempEval challenge: identifying temporal relations in text</article-title>
          <source>Lang Resour Evaluation</source>
          <year>2009</year>
          <volume>43</volume>
          <issue>2</issue>
          <fpage>161</fpage>
          <lpage>179</lpage>
          <pub-id pub-id-type="doi">10.1007/s10579-009-9086-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>UzZaman</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Llorens</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Derczynski</surname>
              <given-names>LRA</given-names>
            </name>
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2013 Task 1: TempEval-3 - evaluating time expressions, events, and temporal relations</article-title>
          <year>2013</year>
          <conf-name>SEM 2013 - Proceedings of the 2nd Joint Conference on Lexical and Computational Semantics</conf-name>
          <conf-date>2013 June 14</conf-date>
          <conf-loc>Atlanta, Georgia, USA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>14</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/S13-2001/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saurí</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Caselli</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2010 Task 13: TempEval-2 - Evaluating events, time expressions, and temporal relations</article-title>
          <year>2010</year>
          <conf-name>SemEval 2010 - Proceedings of the 5th International Workshop on Semantic Evaluation @ ACL 2010</conf-name>
          <conf-date>2010 July 15</conf-date>
          <conf-loc>Uppsala, Sweden</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>57</fpage>
          <lpage>62</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/1859664.1859674"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Graff</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The AQUAINT corpus of English news text</article-title>
          <source>International Standard Language Resource Number</source>
          <year>2002</year>
          <access-date>2026-01-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.islrn.org/resources/153-002-267-999-9/">https://www.islrn.org/resources/153-002-267-999-9/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Minard</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Speranza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Agirre</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Aldabe</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>van Erp</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Magnini</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Semeval-2015 Task 4: TimeLine - cross-document event ordering</article-title>
          <year>2015</year>
          <conf-name>SemEval 2015 - Proceedings of the 9th International Workshop on Semantic Evaluation @ NAACL-HLT 2015</conf-name>
          <conf-date>2015 June 04</conf-date>
          <conf-loc>Denver, Colorado, USA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>778</fpage>
          <lpage>786</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/s15-2132</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Gorman</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wright-Bettner</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Richer event description: integrating event coreference with temporal, causal and bridging annotation</article-title>
          <year>2016</year>
          <conf-name>CNewsStory 2016 - Proceedings of the 2nd Workshop on Computing News Storylines @ EMNLP 2016</conf-name>
          <conf-date>2016 Nov 05</conf-date>
          <conf-loc>Austin, Texas, USA</conf-loc>
          <publisher-name>Curran Associates, Inc</publisher-name>
          <fpage>47</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w16-5706</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mostafazadeh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Grealish</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderwende</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>CaTeRS : causal and temporal relation scheme for semantic annotation of event structures</article-title>
          <year>2016</year>
          <conf-name>EVENTS - Proceedings of the 4th Workshop on Events: Definition, Detection, Coreference, and Representation @ NAACL-HLT 2016</conf-name>
          <conf-date>2016 June 17</conf-date>
          <conf-loc>San Diego, California</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>51</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w16-1007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caselli</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Vossen</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The Event StoryLine corpus: a new benchmark for causal and temporal relation extraction</article-title>
          <year>2017</year>
          <conf-name>EventStory 2017 - Proceedings of the [1st] Workshop on Events and Stories in the News @ ACL 2017</conf-name>
          <conf-date>2017 Aug 04</conf-date>
          <conf-loc>Vancouver, British Columbia, Canada</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>77</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w17-2711</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silveira</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Doza</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>de Marneffe</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Bowman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Connor</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A gold standard dependency corpus for English</article-title>
          <year>2014</year>
          <conf-name>LREC 2014 - Proceedings of the 9th International Conference on Language Resources and Evaluation</conf-name>
          <conf-date>2014 May 26</conf-date>
          <conf-loc>Reykjavik, Iceland</conf-loc>
          <publisher-name>European Language Resources Association (ELRA)</publisher-name>
          <fpage>2897</fpage>
          <lpage>2904</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/L14-1067/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Min</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Annotating temporal dependency graphs via crowdsourcing</article-title>
          <year>2020</year>
          <conf-name>EMNLP 2020 - Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>2020 Nov 16</conf-date>
          <conf-loc>USA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>5368</fpage>
          <lpage>5380</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.emnlp-main.432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Maven-Ere: a unified large-scale dataset for event coreference, temporal, causal, and subevent relation extraction</article-title>
          <year>2022</year>
          <conf-name>EMNLP 2022 - Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>2022 Dec 07</conf-date>
          <conf-loc>Abu Dhabi, United Arab Emirates</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>926</fpage>
          <lpage>941</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2022.emnlp-main.60</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Karpinska</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lialin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Smelkov</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rumshisky</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Narrative Time : dense temporal annotation on a timeline</article-title>
          <year>2024</year>
          <conf-name>LREC-COLING 2024 - Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation</conf-name>
          <conf-date>2024 May 20</conf-date>
          <conf-loc>Torino, Italia</conf-loc>
          <publisher-name>European Language Resources Association (ELRA)</publisher-name>
          <fpage>12053</fpage>
          <lpage>12073</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2024.lrec-main.1054/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gaizauskas</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schilder</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hepple</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2007 Task 15: TempEval - Temporal relation identification</article-title>
          <year>2007</year>
          <conf-name>SemEval 2007 - Proceedings of the 4th International Workshop on Semantic Evaluations @ ACL 2007</conf-name>
          <conf-date>2007 June 23</conf-date>
          <conf-loc>Prague, Czech Republic</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>75</fpage>
          <lpage>80</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/S07-1014/"/>
          </comment>
          <pub-id pub-id-type="doi">10.3115/1621474.1621488</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Llorens</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>UzZaman</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mostafazadeh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2015 task 5: QA TEMPEVAL - evaluating temporal information understanding with question answering</article-title>
          <year>2015</year>
          <conf-name>SemEval 2015 - Proceedings of the 9th International Workshop on Semantic Evaluation @ NAACL-HLT 2015</conf-name>
          <conf-date>2015 June 04</conf-date>
          <conf-loc>Denver, Colorado, USA</conf-loc>
          <publisher-name>Curran Associates, Inc</publisher-name>
          <fpage>792</fpage>
          <lpage>800</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/s15-2134</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Hirschman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>D'Avolio</surname>
              <given-names>LW</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Overcoming barriers to NLP for clinical text: the role of shared tasks and the need for additional creative solutions</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2011</year>
          <volume>18</volume>
          <issue>5</issue>
          <fpage>540</fpage>
          <lpage>543</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21846785"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000465</pub-id>
          <pub-id pub-id-type="medline">21846785</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000465</pub-id>
          <pub-id pub-id-type="pmcid">PMC3168329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Filannino</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Advancing the state of the art in clinical natural language processing through shared tasks</article-title>
          <source>Yearb Med Inform</source>
          <year>2018</year>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>184</fpage>
          <lpage>192</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0038-1667079"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0038-1667079</pub-id>
          <pub-id pub-id-type="medline">30157522</pub-id>
          <pub-id pub-id-type="pmcid">PMC6115235</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vashishtha</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Van Durme</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Fine-grained temporal relation extraction</article-title>
          <year>2019</year>
          <conf-name>ACL 2019 - Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics;  - August 2; Florence, Italy. Association for Computational Linguistics (ACL). 2019</conf-name>
          <conf-date>2019 July 28</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>2906</fpage>
          <lpage>2919</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/p19-1280</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gaizauskas</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hepple</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Demetriou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Setzer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Building a semantically annotated corpus of clinical texts</article-title>
          <source>J Biomed Inform</source>
          <year>2009</year>
          <volume>42</volume>
          <issue>5</issue>
          <fpage>950</fpage>
          <lpage>966</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(09)00006-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2008.12.013</pub-id>
          <pub-id pub-id-type="medline">19535011</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(09)00006-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rumshisky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Evaluating temporal relations in clinical text: 2012 i2b2 challenge</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>806</fpage>
          <lpage>813</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23564629"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2013-001628</pub-id>
          <pub-id pub-id-type="medline">23564629</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2013-001628</pub-id>
          <pub-id pub-id-type="pmcid">PMC3756273</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rumshisky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Annotating temporal information in clinical narratives</article-title>
          <source>J Biomed Inform</source>
          <year>2013</year>
          <volume>46</volume>
          <fpage>S5</fpage>
          <lpage>S12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00103-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2013.07.004</pub-id>
          <pub-id pub-id-type="medline">23872518</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(13)00103-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC3855581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Styler</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Finan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pradhan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>de Groen</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Erickson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Temporal annotation in the clinical domain</article-title>
          <source>Trans Assoc Comput Linguist</source>
          <year>2014</year>
          <volume>2</volume>
          <fpage>143</fpage>
          <lpage>154</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29082229"/>
          </comment>
          <pub-id pub-id-type="medline">29082229</pub-id>
          <pub-id pub-id-type="pmcid">PMC5657277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Derczynski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2015 task 6: clinical TempEval</article-title>
          <year>2015</year>
          <conf-name>SemEval 2015 - Proceedings of the 9th International Workshop on Semantic Evaluation @ NAACL-HLT 2015</conf-name>
          <conf-date>2015 June 04</conf-date>
          <conf-loc>Denver, Colorado, USA</conf-loc>
          <publisher-name>Curran Associates</publisher-name>
          <fpage>806</fpage>
          <lpage>814</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/s15-2136</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>WT</given-names>
            </name>
            <name name-style="western">
              <surname>Derczynski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2016 task 12: clinical TempEval</article-title>
          <year>2016</year>
          <conf-name>SemEval 2016 - Proceedings of the 10th International Workshop on Semantic Evaluation @ NAACL-HLT 2016</conf-name>
          <conf-date>2016 June 16</conf-date>
          <conf-loc>San Diego, California, USA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>1052</fpage>
          <lpage>1062</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/s16-1165</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2017 task 12: clinical TempEval</article-title>
          <year>2017</year>
          <conf-name>SemEval 2017 - Proceedings of the 11th International Workshop on Semantic Evaluation @ ACL 2017</conf-name>
          <conf-date>2017 Aug 03</conf-date>
          <conf-loc>Vancouver, British Columbia, Canada</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>565</fpage>
          <lpage>572</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/s17-2093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Tsou</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Overview of the 2022 n2c2 shared task on contextualized medication event extraction in clinical notes</article-title>
          <source>J Biomed Inform</source>
          <year>2023</year>
          <volume>144</volume>
          <fpage>104432</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(23)00153-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2023.104432</pub-id>
          <pub-id pub-id-type="medline">37356640</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(23)00153-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10529825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
          </person-group>
          <article-title>Creation of a new longitudinal corpus of clinical narratives</article-title>
          <source>J Biomed Inform</source>
          <year>2015</year>
          <volume>58</volume>
          <issue>Suppl</issue>
          <fpage>S6</fpage>
          <lpage>S10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(15)00212-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.09.018</pub-id>
          <pub-id pub-id-type="medline">26433122</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(15)00212-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC4978168</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Viani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tissot</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bernardino</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Velupillai</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Annotating temporal information in clinical notes for timeline reconstruction: towards the definition of calendar expressions</article-title>
          <year>2019</year>
          <conf-name>BioNLP 2019 - Proceedings of the 18th SIGBioMed Workshop on Biomedical Natural Language Processing and Shared Task @ ACL 2019</conf-name>
          <conf-date>2019 Aug 01</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <fpage>201</fpage>
          <lpage>210</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w19-5021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spreyer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Projection-based acquisition of a temporal labeller</article-title>
          <year>2008</year>
          <conf-name>IJCNLP 2008 - Proceedings of the 3rd International Joint Conference on Natural Language Processing</conf-name>
          <conf-date>2008 Jan 07</conf-date>
          <conf-loc>Hyderabad, India</conf-loc>
          <publisher-name>Asian Federation of Natural Language Processing (AFNLP)</publisher-name>
          <fpage>489</fpage>
          <lpage>496</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/I08-1064/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strötgen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gertz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>WikiWarsDE: a German corpus of narratives annotated with temporal expressions</article-title>
          <source>Multilingual Resources and Multilingual Applications</source>
          <year>2011</year>
          <conf-name>GSCL 2011 - Proceedings of the Conference of the German Society for Computational Linguistics and Language Technology</conf-name>
          <conf-date>2011 Sep 28</conf-date>
          <conf-loc>Hamburg, Germany</conf-loc>
          <publisher-name>Hamburger Zentrum für Sprachkorpora</publisher-name>
          <fpage>129</fpage>
          <lpage>134</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dbs.ifi.uni-heidelberg.de/fileadmin/Team/jannik/publications/StroetgenGertz_WikiWarsDE_GSCL2011.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mazur</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dale</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>WIKIWARS : a new corpus for research on temporal expressions</article-title>
          <year>2010</year>
          <conf-name>EMNLP 2010 - Proceedings of the 2010 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>2010 Oct 09</conf-date>
          <conf-loc>Boston, Massachusetts, USA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>913</fpage>
          <lpage>922</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/D10-1089/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strötgen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Minard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lange</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Speranza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Magnini</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>KRAUTS: a German temporally annotated news corpus</article-title>
          <year>2018</year>
          <conf-name>LREC 2018 - Proceedings of the 11th International Conference on Language Resources and Evaluation</conf-name>
          <conf-date>2018 May 07</conf-date>
          <conf-loc>Miyazaki, Japan</conf-loc>
          <publisher-name>European Language Resources Association (ELRA)</publisher-name>
          <fpage>536</fpage>
          <lpage>540</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/L18-1085/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strötgen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gertz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Multilingual and cross-domain temporal tagging</article-title>
          <source>Lang Resour Evaluation</source>
          <year>2012</year>
          <volume>47</volume>
          <issue>2</issue>
          <fpage>269</fpage>
          <lpage>298</lpage>
          <pub-id pub-id-type="doi">10.1007/s10579-012-9179-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lücking</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stoeckel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abrami</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mehler</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>I still have time(s): extending HeidelTime for German texts</article-title>
          <year>2022</year>
          <conf-name>LREC 2022 - Proceedings of the 13th International Conference on Language Resources and Evaluation</conf-name>
          <conf-date>2022 June 20</conf-date>
          <conf-loc>Marseille, France</conf-loc>
          <publisher-name>European Language Resources Association (ELRA)</publisher-name>
          <fpage>4723</fpage>
          <lpage>4728</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2022.lrec-1.505/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roller</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Seiffe</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mikhailov</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Staeck</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>A fine-grained corpus annotation schema of German nephrology records</article-title>
          <year>2016</year>
          <conf-name>ClinicalNLP 2016 - Proceedings of the 1st Workshop on Clinical Natural Language Processing @ COLING 2016</conf-name>
          <conf-date>2016 December 11</conf-date>
          <conf-loc>Osaka, Japan</conf-loc>
          <publisher-name>COLING 2016 Organizing Committee</publisher-name>
          <fpage>69</fpage>
          <lpage>77</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/W16-4210/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Campillos</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Deléger</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Grouin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hamon</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ligozat</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Névéol</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A French clinical corpus with comprehensive semantic annotations: development of the medical entity and relation LIMSI annOtated Text corpus (MERLOT)</article-title>
          <source>Lang Resour Evaluation</source>
          <year>2017</year>
          <volume>52</volume>
          <issue>2</issue>
          <fpage>571</fpage>
          <lpage>601</lpage>
          <pub-id pub-id-type="doi">10.1007/s10579-017-9382-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamon</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Grabar</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Tuning HeidelTime for identifying time expressions in clinical texts in English and French</article-title>
          <year>2014</year>
          <conf-name>LOUHI 2014 - Proceedings of the 5th International Workshop on Health Text Mining and Information Analysis @ EACL 2014</conf-name>
          <conf-date>2014 April 27</conf-date>
          <conf-loc>Gothenburg, Sweden</conf-loc>
          <fpage>101</fpage>
          <lpage>105</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/w14-1116</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bannour</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rance</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tannier</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Névéol</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Event-independent temporal positioning: application to French clinical text</article-title>
          <year>2023</year>
          <conf-name>BioNLP 2023 - Proceedings of the 22nd Workshop on Biomedical Language Processing (BioNLP) &#38; BioNLP Shared Tasks (BioNLP-ST) @ ACL 2023</conf-name>
          <conf-date>2023 July 13</conf-date>
          <conf-loc>Ontario, Canada</conf-loc>
          <fpage>191</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2023.bionlp-1.16</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jeyafreeda</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vincent</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burgun</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garcelon</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Evaluating LLMs for temporal entity extraction from pediatric clinical text in rare diseases context</article-title>
          <year>2024</year>
          <conf-name>CL4Health 2024 - Proceedings of the 1st Workshop on Patient-Oriented Language Processing @ LREC-COLING 2024</conf-name>
          <conf-date>2024 May 20</conf-date>
          <conf-loc>Torino, Italia</conf-loc>
          <fpage>145</fpage>
          <lpage>152</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2024.cl4health-1.18/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Temporal indexing of medical entity in Chinese clinical notes</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <volume>19</volume>
          <issue>Suppl 1</issue>
          <fpage>17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0735-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0735-x</pub-id>
          <pub-id pub-id-type="medline">30700331</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0735-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC6354334</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Temporal expression classification and normalization from Chinese narrative clinical texts: pattern learning approach</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>7</issue>
          <fpage>e17652</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/7/e17652/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17652</pub-id>
          <pub-id pub-id-type="medline">32716307</pub-id>
          <pub-id pub-id-type="pii">v8i7e17652</pub-id>
          <pub-id pub-id-type="pmcid">PMC7418025</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>CMedTEX: a rule-based temporal expression extraction and normalization system for Chinese clinical notes</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>818</fpage>
          <lpage>826</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28269878"/>
          </comment>
          <pub-id pub-id-type="medline">28269878</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333232</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Knowledge representation and reasoning for complex time expression in clinical text</article-title>
          <source>Data Intell</source>
          <year>2022</year>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>573</fpage>
          <lpage>598</lpage>
          <pub-id pub-id-type="doi">10.1162/dint_a_00152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Velupillai</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Temporal expressions in Swedish medical text: a pilot study</article-title>
          <year>2014</year>
          <conf-name>BioNLP 2014 - Proceedings of the Workshop on Biomedical Natural Language Processing @ ACL 2014</conf-name>
          <conf-date>2024 June 27</conf-date>
          <conf-loc>Baltimore, Maryland, USA</conf-loc>
          <fpage>88</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/w14-3413</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Azevedo</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Santos Rodrigues</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>da Silva Reis</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Cabral Moro</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Cabrera Paraiso</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Temporal tagging of noisy clinical texts in Brazilian Portuguese</article-title>
          <source>Computational Processing of the Portuguese Language</source>
          <year>2018</year>
          <conf-name>PROPOR 2018 - Proceedings of the 13th International Conference on Computational Processing of the Portuguese Language</conf-name>
          <conf-date>2018 Sep 24</conf-date>
          <conf-loc>Canela, Brazil</conf-loc>
          <fpage>231</fpage>
          <lpage>241</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-99722-3_24</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Viani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Napolitano</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Priori</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Bellazzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sacchi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Supervised methods to extract clinical events from cardiology reports in Italian</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <volume>95</volume>
          <fpage>103219</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30139-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103219</pub-id>
          <pub-id pub-id-type="medline">31150777</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30139-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC6948016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kurohashi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>JaMIE: a pipeline Japanese medical information extraction system with novel relation annotation</article-title>
          <year>2022</year>
          <conf-name>LREC 2022 - Proceedings of the 13th International Conference on Language Resources and Evaluation</conf-name>
          <conf-date>2022 June 20</conf-date>
          <conf-loc>Marseille, France</conf-loc>
          <fpage>3724</fpage>
          <lpage>3731</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2022.lrec-1.397/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kanashiro</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Yada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>QA-based event start-points ordering for clinical temporal relation annotation</article-title>
          <year>2024</year>
          <conf-name>LREC-COLING 2024 - Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation</conf-name>
          <conf-date>2024 May 20</conf-date>
          <conf-loc>Torino, Italia</conf-loc>
          <fpage>13371</fpage>
          <lpage>13381</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2024.lrec-main.1171/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magnini</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Altuna</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lavelli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Minard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Speranza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zanoli</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Rehm</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>European clinical case corpus</article-title>
          <source>European Language Grid: a Language Technology Platform for Multilingual Europe</source>
          <year>2023</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>283</fpage>
          <lpage>288</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Matthies</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lohr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Löffler</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>3000PA-towards a national reference corpus of German clinical language</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2018</year>
          <volume>247</volume>
          <fpage>26</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="medline">29677916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lohr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Luther</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matthies</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Modersohn</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ammon</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Saleh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Henkel</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Kiehntopf</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>CDA-compliant section annotation of German-language discharge summaries: guideline development, annotation campaign, section classification</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>770</fpage>
          <lpage>779</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30815119"/>
          </comment>
          <pub-id pub-id-type="medline">30815119</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kolditz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lohr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hellrich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Modersohn</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Betz</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kiehntopf</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Annotating German clinical documents for de-identification</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <volume>264</volume>
          <fpage>203</fpage>
          <lpage>207</lpage>
          <pub-id pub-id-type="doi">10.3233/shti190212</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lohr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Modersohn</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hellrich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kolditz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>An evolutionary approach to the annotation of discharge summaries</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2020</year>
          <volume>270</volume>
          <fpage>28</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.3233/shti200116</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Modersohn</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lohr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>GraSCCo: the first publicly shareable, multiply-alienated German clinical text corpus</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2022</year>
          <volume>270</volume>
          <fpage>66</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.3233/shti220805</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>GraSCCo</article-title>
          <source>Zenodo (CERN European Organization for Nuclear Research)</source>
          <year>2022</year>
          <access-date>2025-08-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.5281/zenodo.6539131">https://doi.org/10.5281/zenodo.6539131</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kweon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Im</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bae</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Baek</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Jo</surname>
              <given-names>YB</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Publicly shareable clinical large language model built on synthetic clinical notes</article-title>
          <year>2024</year>
          <conf-name>Findings of the Association for Computational Linguistics - ACL 2024</conf-name>
          <conf-date>2024 Aug 11</conf-date>
          <conf-loc>Bangkok, Thailand</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>5148</fpage>
          <lpage>5168</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2024.findings-acl.305</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>SVS</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Are synthetic clinical notes useful for real natural language processing tasks: a case study on clinical entity recognition</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>10</issue>
          <fpage>2193</fpage>
          <lpage>2201</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34272955"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocab112</pub-id>
          <pub-id pub-id-type="medline">34272955</pub-id>
          <pub-id pub-id-type="pii">6323280</pub-id>
          <pub-id pub-id-type="pmcid">PMC8449609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ive</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Viani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Puntis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cardinal</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Velupillai</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Generation and evaluation of artificial mental health records for natural language processing</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <volume>3</volume>
          <issue>69</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-020-0267-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-020-0267-x</pub-id>
          <pub-id pub-id-type="medline">32435697</pub-id>
          <pub-id pub-id-type="pii">267</pub-id>
          <pub-id pub-id-type="pmcid">PMC7224173</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hiebel</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ferret</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Fort</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Névéol</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Can synthetic text help clinical named entity recognition? a study of electronic health records in French</article-title>
          <year>2023</year>
          <conf-name>EACL 2023 - Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics</conf-name>
          <conf-date>2023 May 06</conf-date>
          <conf-loc>Dubrovnik, Croatia</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>2320</fpage>
          <lpage>2338</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2023.eacl-main.170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brekke</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Rama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pilán</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nytrø</surname>
              <given-names>Ø</given-names>
            </name>
            <name name-style="western">
              <surname>Øvrelid</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Synthetic data for annotation and extraction of family history information from clinical text</article-title>
          <source>J Biomed Semantics</source>
          <year>2021</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/s13326-021-00244-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13326-021-00244-2</pub-id>
          <pub-id pub-id-type="medline">34261535</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13326-021-00244-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8278746</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pustejovsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Natural Language Annotation for Machine Learning - A Guide to corpus-building for Applications</source>
          <year>2012</year>
          <publisher-loc>California</publisher-loc>
          <publisher-name>O'Reilly Media, Inc</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Artstein</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Poesio</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Inter-coder agreement for computational linguistics</article-title>
          <source>Comput Linguist</source>
          <year>2008</year>
          <volume>34</volume>
          <issue>4</issue>
          <fpage>555</fpage>
          <lpage>596</lpage>
          <pub-id pub-id-type="doi">10.1162/coli.07-034-R2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kolditz</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Bratiaa: inter-annotator agreement for brat annotation projects</article-title>
          <source>GitHub</source>
          <year>2019</year>
          <access-date>2025-08-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/kldtz/bratiaa">https://github.com/kldtz/bratiaa</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reimers</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dehghani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gurevych</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Temporal anchoring of events for the TIMEBANK corpus</article-title>
          <year>2016</year>
          <conf-name>ACL 2016 - Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>2016 Aug 07</conf-date>
          <conf-loc>Berlin, Germany</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>2195</fpage>
          <lpage>2204</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/p16-1207</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verhagen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Temporal closure in an annotation environment</article-title>
          <source>Language Res Eval</source>
          <year>2006</year>
          <volume>39</volume>
          <issue>2-3</issue>
          <fpage>211</fpage>
          <lpage>241</lpage>
          <pub-id pub-id-type="doi">10.1007/s10579-005-7884-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stenetorp</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pyysalo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Topi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ohta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tsujii</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BRAT: a Web-based tool for NLP-assisted text annotation</article-title>
          <year>2012</year>
          <conf-name>EACL 2012 - Proceedings of the 13th Conference of the European Chapter of the Association for Computational Linguistics: Demonstrations</conf-name>
          <conf-date>2012 Apr 25</conf-date>
          <conf-loc>Avignon, France</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>25</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/E12-2021/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Schweter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Möller</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>German's next language model</article-title>
          <year>2020</year>
          <conf-name>COLING 2020 - Proceedings of the 28th International Conference on Computational Linguistics</conf-name>
          <conf-date>2020 Dec 08</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <publisher-name>International Committee on Computational Linguistics (ICCL)</publisher-name>
          <fpage>6788</fpage>
          <lpage>6796</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.coling-main.598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Falkner</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hutter</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>BOHB: robust and efficient hyperparameter optimization at scale</article-title>
          <year>2018</year>
          <conf-name>ICML 2018 - Proceedings of the 35th International Conference on Machine Learning</conf-name>
          <conf-date>2018 July 10</conf-date>
          <conf-loc>Stockholm, Sweden</conf-loc>
          <publisher-name>Proceedings of Machine Learning Research</publisher-name>
          <fpage>1437</fpage>
          <lpage>1446</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.mlr.press/v80/falkner18a.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="web">
          <article-title>Huggingface: Huggingface/Transformers</article-title>
          <source>GitHub</source>
          <year>2020</year>
          <access-date>2025-08-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/huggingface/transformers">https://github.com/huggingface/transformers</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="web">
          <article-title>Microsoft: neural network intelligence</article-title>
          <source>GitHub</source>
          <year>2021</year>
          <access-date>2025-08-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/microsoft/nni">https://github.com/microsoft/nni</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Durrett</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Embedding time expressions for deep temporal ordering models</article-title>
          <year>2019</year>
          <conf-name>ACL 2019 - Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>2019 Aug 02</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>4400</fpage>
          <lpage>4406</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/p19-1433</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Han</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tresp</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Time-dependent entity embedding is not all you need: a re-evaluation of temporal knowledge graph completion models under a unified framework</article-title>
          <year>2021</year>
          <conf-name>EMNLP 2021 - Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>2021 Nov 07</conf-date>
          <conf-loc>Punta Cana, Dominican Republic</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>8104</fpage>
          <lpage>8118</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2021.emnlp-main.639</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qiao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Learning joint structural and temporal contextualized knowledge embeddings for temporal knowledge graph completion</article-title>
          <year>2023</year>
          <conf-name>Findings of the Association for Computational Linguistics - ACL 2023</conf-name>
          <conf-date>2023 July 09</conf-date>
          <conf-loc>Toronto, Ontario, Canada</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>417</fpage>
          <lpage>430</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2023.findings-acl.28</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref102">
        <label>102</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mathur</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dernoncourt</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Morariu</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>QH</given-names>
            </name>
            <name name-style="western">
              <surname>Manocha</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>TIMERS: document-level temporal relation extraction</article-title>
          <year>2021</year>
          <conf-name>ACL-IJCNLP 2021 - Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics &#38; 11th International Joint Conference on Natural Language Processing</conf-name>
          <conf-date>2021 Aug 01</conf-date>
          <conf-loc>Stroudsburg, PA</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>524</fpage>
          <lpage>533</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2021.acl-short.67</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref103">
        <label>103</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Document-level relation extraction with two-stage dynamic graph attention networks</article-title>
          <source>Knowl Based Syst</source>
          <year>2023</year>
          <volume>267</volume>
          <fpage>110428</fpage>
          <pub-id pub-id-type="doi">10.1016/j.knosys.2023.110428</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref104">
        <label>104</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wehbe</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A comparative study of pretrained language models for long clinical text</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2023</year>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>340</fpage>
          <lpage>347</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36451266"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocac225</pub-id>
          <pub-id pub-id-type="medline">36451266</pub-id>
          <pub-id pub-id-type="pii">6855145</pub-id>
          <pub-id pub-id-type="pmcid">PMC9846675</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref105">
        <label>105</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gaizauskas</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hepple</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Demetriou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kola</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Setzer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tapuria</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wheeldin</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The CLEF corpus: semantic annotation of clinical text</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2007</year>
          <volume>2007</volume>
          <fpage>625</fpage>
          <lpage>629</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/18693911"/>
          </comment>
          <pub-id pub-id-type="medline">18693911</pub-id>
          <pub-id pub-id-type="pmcid">PMC2655900</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref106">
        <label>106</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raghavan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fosler-Lussier</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Inter-annotator reliability of medical events, coreferences and temporal relations in clinical narratives by annotators with varying levels of clinical expertise</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2012</year>
          <volume>2012</volume>
          <fpage>1366</fpage>
          <lpage>1374</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23304416"/>
          </comment>
          <pub-id pub-id-type="medline">23304416</pub-id>
          <pub-id pub-id-type="pmcid">PMC3540452</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref107">
        <label>107</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bastardo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pavão</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Ramos</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A timeline model for clinical events: empowering data</article-title>
          <source>Procedia Comput Sci</source>
          <year>2022</year>
          <volume>196</volume>
          <fpage>1053</fpage>
          <lpage>1058</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2021.12.109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref108">
        <label>108</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hummer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ocal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>PYTLEX : A PYTHON library for TimeLine extraction</article-title>
          <year>2024</year>
          <conf-name>EACL 2024 - Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics: System Demonstrations</conf-name>
          <conf-date>2024 March 17</conf-date>
          <conf-loc>St. Julian's, Malta</conf-loc>
          <publisher-name>Association for Computational Linguistics (ACL)</publisher-name>
          <fpage>27</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2024.eacl-demo.4</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
