<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="research-article">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">NHESS</journal-id><journal-title-group>
    <journal-title>Natural Hazards and Earth System Sciences</journal-title>
    <abbrev-journal-title abbrev-type="publisher">NHESS</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Nat. Hazards Earth Syst. Sci.</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1684-9981</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/nhess-26-2609-2026</article-id><title-group><article-title>Wikimpacts 1.0: a new global climate impact database based on automated information extraction from Wikipedia</article-title><alt-title>Wikimpacts 1.0</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes" rid="aff1 aff2">
          <name><surname>Li</surname><given-names>Ni</given-names></name>
          <email>ni.li@vub.be</email>
        <ext-link>https://orcid.org/0009-0000-4260-5284</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Thiery</surname><given-names>Wim</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-5183-6145</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3 aff6 aff7">
          <name><surname>Zahra</surname><given-names>Shorouq</given-names></name>
          
        <ext-link>https://orcid.org/0009-0007-2792-9345</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4">
          <name><surname>Madruga de Brito</surname><given-names>Mariana</given-names></name>
          
        <ext-link>https://orcid.org/0000-0003-4191-1647</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5 aff6">
          <name><surname>Worou</surname><given-names>Koffi</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-2230-8431</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3 aff7">
          <name><surname>Kurfalı</surname><given-names>Murathan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Lampe</surname><given-names>Seppe</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-7907-4496</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff12">
          <name><surname>Muñoz</surname><given-names>Paul</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-8000-8840</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5 aff6">
          <name><surname>Flynn</surname><given-names>Clare</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Trigoso</surname><given-names>Camila</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3 aff6 aff8">
          <name><surname>Nivre</surname><given-names>Joakim</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2 aff9 aff10">
          <name><surname>Zscheischler</surname><given-names>Jakob</given-names></name>
          
        <ext-link>https://orcid.org/0000-0001-6045-1629</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff5 aff6 aff11">
          <name><surname>Messori</surname><given-names>Gabriele</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-2032-5211</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>Department of Water and Climate, Vrije Universiteit Brussel, Brussels, Belgium</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>Department of Hydro Sciences, TUD Dresden University of Technology, Dresden, Germany</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>RISE Research Institutes of Sweden, Sweden</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>Department of Urban and Environmental Sociology, Helmholtz Centre for Environmental  Research – UFZ, Leipzig, Germany</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>Department of Earth Sciences, Uppsala University, Uppsala, Sweden</institution>
        </aff>
        <aff id="aff6"><label>6</label><institution>Swedish centre for impacts of climate extremes (climes), Uppsala University, Uppsala, Sweden</institution>
        </aff>
        <aff id="aff7"><label>7</label><institution>Swedish centre for impacts of climate extremes (climes), RISE, Stockholm, Sweden</institution>
        </aff>
        <aff id="aff8"><label>8</label><institution>Department of Linguistics and Philology, Uppsala University, Uppsala, Sweden</institution>
        </aff>
        <aff id="aff9"><label>9</label><institution>Department of Compound Environmental Risks, Helmholtz Centre for Environmental Research – UFZ, Leipzig, Germany</institution>
        </aff>
        <aff id="aff10"><label>10</label><institution>Center for Scalable Data Analytics and Artificial Intelligence (ScaDS.AI), Dresden/Leipzig, Germany</institution>
        </aff>
        <aff id="aff11"><label>11</label><institution>Department of Meteorology, Stockholm University, Stockholm, Sweden</institution>
        </aff>
        <aff id="aff12"><label>12</label><institution>Departamento de Recursos Hídricos, Universidad de Concepción, 3812120, Chillán, Chile</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Ni Li (ni.li@vub.be)</corresp></author-notes><pub-date><day>4</day><month>June</month><year>2026</year></pub-date>
      
      <volume>26</volume>
      <issue>6</issue>
      <fpage>2609</fpage><lpage>2636</lpage>
      <history>
        <date date-type="received"><day>2</day><month>October</month><year>2025</year></date>
           <date date-type="rev-request"><day>29</day><month>October</month><year>2025</year></date>
           <date date-type="rev-recd"><day>10</day><month>April</month><year>2026</year></date>
           <date date-type="accepted"><day>21</day><month>April</month><year>2026</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 Ni Li et al.</copyright-statement>
        <copyright-year>2026</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026.html">This article is available from https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026.html</self-uri><self-uri xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026.pdf">The full text article is available as a PDF file from https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e269">Climate extremes like storms, heatwaves, wildfires, droughts and floods significantly threaten society and ecosystems. However, comprehensive data on the socio-economic impacts of climate extremes remains limited. Here we present Wikimpacts 1.0, a global climate impact database built by extracting information from Wikipedia using natural language processing. Our method identifies relevant articles, extracts the information using GPT4o, post-processes the information and consolidates the database. Impact data is stored at the event, national, and sub-national levels, covering 2726 events from 1034 to 2024, with 17 912 national and 32 343 sub-national entries. The database shows low error scores (range from 0 to 1) for event-level information like timing (0.05), deaths (0.03), and economic damage (0.12), and slightly higher error scores for injuries (0.21), homelessness (0.25), displacement (0.29), and damaged buildings (0.28) compared to manually annotated data from 156 events. Wikimpacts 1.0 provides a different event coverage than EM-DAT, notably providing broader coverage of storm impacts but more limited coverage of flood impacts. We match 179 events between the two databases to compare impact values, and find that 32 out of 179 matched events have identical data for deaths, and 7 out of 77 for injuries. However, there are notable discrepancies in information on homelessness and damage. We view the publicly available Wikimpacts 1.0 database as a complementary resource to existing impact databases, which facilitates subnational climate impact assessments, and highlights the potential of natural language processing to enhance existing impact datasets and provide robust information on climate impacts. Lastly, we provide a static version of the database as used in this paper at <uri>https://bolin.su.se/data/li-2025-wikimpacts-1.0.final</uri> (last access: 20 May 2026) and the Wikimpacts website (<uri>https://www.wikimpacts.eu/</uri>, last access: 20 May 2026) for visualization and access for future updates of the database.</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>HORIZON EUROPE European Research Council</funding-source>
<award-id>101124572</award-id>
<award-id>101112727</award-id>
</award-group>
<award-group id="gs2">
<funding-source>Vetenskapsrådet</funding-source>
<award-id>2022-06599</award-id>
<award-id>2022-03448</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e287">Climate extremes – such as storms, heatwaves, wildfires, floods, and droughts – cause substantial impacts to society, often leading to large losses of life and property. These consequences are expected to exacerbate in the future due to the ongoing climate and land-use changes <xref ref-type="bibr" rid="bib1.bibx42 bib1.bibx3" id="paren.1"/>. Climate change has already led to an increase in the frequency, intensity, duration and geographical extent of many climate-related extreme events, a trend projected to continue in the coming decades <xref ref-type="bibr" rid="bib1.bibx42 bib1.bibx22 bib1.bibx47 bib1.bibx32" id="paren.2"/>. A comprehensive understanding of the impacts of extreme climate events is crucial for improving impact forecasting, impact projections, early warning systems, and managing disaster risks <xref ref-type="bibr" rid="bib1.bibx46 bib1.bibx7 bib1.bibx19 bib1.bibx71" id="paren.3"/>. For example, accurate and geographically-resolved impact data is essential for pinpointing areas that are disproportionately affected by climate extremes <xref ref-type="bibr" rid="bib1.bibx17" id="paren.4"/>, allowing for targeted allocation of climate adaptation efforts. Climate impact data can also be used to assess the effectiveness of adaptation measures in reducing loss and damage from climate extremes <xref ref-type="bibr" rid="bib1.bibx21" id="paren.5"/>.</p>
      <p id="d2e305">However, currently available climate impact data suffer from a number of limitations. Many global impact databases are proprietary, and not openly available for researchers. Examples include Munich Re's NatCatSERVICE (<ext-link xlink:href="https://www.munichre.com/en/solutions/for-industry-clients/natcatservice.html">https://www.munichre.com/en/solutions/for-industry</ext-link> <ext-link xlink:href="https://www.munichre.com/en/solutions/for-industry-clients/natcatservice.html">-clients/natcatservice.html</ext-link>, last access: 20 May 2026), Swiss Re's Sigma (<uri>https://www.sigma-explorer.com/</uri>, last access: 20 May 2026), and PERILS AG's PERILS (<uri>https://www.perils.org/products/industry-exposure-and-loss-database</uri>, last access: 20 May 2026), originating from the insurance sector. The data in existing open-access global climate impact databases suffer from incompleteness, inconsistencies, and/or biases <xref ref-type="bibr" rid="bib1.bibx18 bib1.bibx49 bib1.bibx37 bib1.bibx30 bib1.bibx29" id="paren.6"/>. One of the most widely used open databases for climate extreme event impact studies is EM-DAT (CRED, <uri>https://www.emdat.be/</uri>, last access: 20 May 2026) <xref ref-type="bibr" rid="bib1.bibx10" id="paren.7"/>. Although EM-DAT is a valuable database, its use for systematic climate impact studies presents several challenges. Researchers have attempted to geolocate disaster events from EM-DAT, yet the resulting data comes with limited temporal coverage (e.g., events from 1960 to 2018, in GDIS data, <xref ref-type="bibr" rid="bib1.bibx40" id="altparen.8"/>) and include some geoparsing errors <xref ref-type="bibr" rid="bib1.bibx70 bib1.bibx27 bib1.bibx45" id="paren.9"/>. Although the geoparsing errors for EM-DAT events from 1990–2023 are handled in a new geocoded database, Geo-Disasters <xref ref-type="bibr" rid="bib1.bibx45" id="paren.10"/>, mapping the aggregated impact from national level to subnational scales remains challenging <xref ref-type="bibr" rid="bib1.bibx40 bib1.bibx10" id="paren.11"/>. Moreover, the level of administrative divisions used in the latter databases varies between countries, and administrative units at the same level can also be highly variable due to the differing resolutions across and within countries, which complicates implementation of damage functions in impact assessment studies <xref ref-type="bibr" rid="bib1.bibx13 bib1.bibx28" id="paren.12"/>. Similarly, temporal information in EM-DAT can be inconsistently documented as a range of days, months, or a single year. Furthermore, when a single physical event has a wide-ranging influence, it may be documented under multiple entries <xref ref-type="bibr" rid="bib1.bibx14" id="paren.13"/>. In addition, the number of events in both developed and underdeveloped countries is likely under-reported <xref ref-type="bibr" rid="bib1.bibx18" id="paren.14"/>. For reported events, there are substantial missing entries in the predefined impact categories, particularly those pertaining to economic losses <xref ref-type="bibr" rid="bib1.bibx20" id="paren.15"/>. Because impact entries are categorized based on a single primary hazard, impacts from co-occurring hazards such as droughts and heatwaves <xref ref-type="bibr" rid="bib1.bibx72" id="paren.16"/> or other multi-hazard events may not be fully captured <xref ref-type="bibr" rid="bib1.bibx23 bib1.bibx29" id="paren.17"/>. Similar limitations also affect other global multi-hazard impact databases, such as DesInventar <xref ref-type="bibr" rid="bib1.bibx50" id="paren.18"/>. While single-hazards databases (e.g. <xref ref-type="bibr" rid="bib1.bibx38 bib1.bibx39 bib1.bibx15" id="altparen.19"/>; IFNet Tokyo, <uri>http://www.internationalfloodnetwork.org/index.html</uri>, last access: 20 May 2026; DFO USA, <ext-link xlink:href="https://floodobservatory.colorado.edu/wiki/Main_Page">https://floodobserva</ext-link> <ext-link xlink:href="https://floodobservatory.colorado.edu/wiki/Main_Page">tory.colorado.edu/wiki/Main_Page</ext-link>, last access: 20 May 2026; WISC EU, <ext-link xlink:href="https://climate.copernicus.eu/windstorm-information-service">https://climate.copernicus.eu/windstorm</ext-link>
<ext-link xlink:href="https://climate.copernicus.eu/windstorm-information-service">-information-service</ext-link>, last access: 20 May 2026), and databases focusing on national spatial scales <xref ref-type="bibr" rid="bib1.bibx43 bib1.bibx8" id="paren.20"><named-content content-type="pre">e.g.,</named-content></xref> have better coverage and completeness, they are generally difficult to expand to multiple hazards or other regions. Furthermore, they all use different impact categories and event definitions, hindering cross-database multi-hazard impact analyses. Lastly, many multi-hazard global databases, as well as single-hazard or national databases, are developed manually by small teams of researchers, which makes timely updates difficult. The manual process also limits traceability of information, making it difficult to link a given entry to a specific data source.</p>
      <p id="d2e392">An alternative source of information on impacts from climate and weather extremes comes from digitalised textual records such as newspaper archives <xref ref-type="bibr" rid="bib1.bibx6 bib1.bibx11 bib1.bibx44 bib1.bibx1" id="paren.21"/> and Twitter <xref ref-type="bibr" rid="bib1.bibx9" id="paren.22"/>. These data can overcome some of the shortcomings of existing impact databases. They provide detailed impact records, which are typically associated with specific dates and locations. Despite the widespread digitalisation of text and the wealth of quantitative information available on impactful climate events, there is currently no global, multi-hazard, open and traceable climate impact database leveraging freely available online textual sources. Here, we present one such database: the accompanying Wikimpacts 1.0 dataset <xref ref-type="bibr" rid="bib1.bibx25" id="paren.23"/>.</p>
      <p id="d2e404">Wikimpacts 1.0 addresses some of the aforementioned database limitations, by providing extensive spatio-temporal coverage (within the scope of Wikipedia), standardized temporal, spatial, and impact information, and ease of updating for new events. Our framework implements an automated, end-to-end pipeline for extracting and processing impact information from the sub-national up to the event level, thereby enabling multi-scale climate impact assessment studies. Our automated multi-step pipeline extracts semi-structured data from English Wikipedia articles by utilizing GPT4o, a pre-trained Large Language Model (LLM). The data then undergoes a post-processing step in which different data points are refined, normalized, and stored in a relational database. As such, this database aims to reflect the information available in Wikipedia as accurately as possible, without evaluating the reliability of the underlying information in the articles. Geo-parsing is a crucial step in our post-processing to connect place names to geographical entities and boost the database's usability for research. The Wikimpacts database is designed to complement existing global disaster impact databases such as EM-DAT and DesInventar, notably by providing georeferenced information at subnational level. Although the inclusion criteria and event definitions differ across databases, matching events by type, date, and location allows us to identify a set of shared events that can be jointly analysed. These overlapping records can support global multi-hazard comparisons and sub-national studies, particularly when combined with climate and other geospatial data. We chose to rely solely on English Wikipedia articles in the Wikimpacts 1.0 database, since we find relatively few climate event articles in other languages that are not also reported in English. We thus do not view the English reporting bias as a main issue. We however acknowledge that regions with limited Wikipedia activity and small or highly localized events are likely to be under-reported. Consequently, the Wikimpacts 1.0 database should not be used in isolation for complete or sensitive national loss assessments. For such applications, we recommend benchmarking Wikimpacts against other existing databases and officially reported government statistics.</p>
      <p id="d2e408">This database has been developed in compliance with Article 3 of Directive (EU) 2019/790 regarding copyright and related rights within the Digital Single Market, utilizing lawful text and text mining techniques. The data encompassed within this database is derived from automated extraction and synthesis of information from legally accessible sources, including publicly available Wikipedia articles. The dataset exclusively comprises factual information (e.g., temporal data, geographic locations, event types, reported impacts) and does not replicate any protected expressions or copyrighted material from the original sources.</p>
      <p id="d2e411">The remainder of this paper is organized as follows. Section 2, <italic>Database Structure</italic>, presents an overview of the database design and the technical definitions of all fields. Section 3, <italic>Wikimpacts Processing Pipeline</italic>, describes in detail the methodology used to construct the database, while Sect. 4, <italic>Evaluation of the Pipeline</italic>, reports the evaluation methods and results. Section 5, <italic>Wikimpacts 1.0: Content of the Database</italic>, presents the spatial and temporal distribution of the database content and compares it with EM-DAT. Section 6, <italic>Discussion</italic>, provides a detailed assessment of the pipeline and database, a comparison with EM-DAT, and presents the limitations of the database. Finally, Sect. 7, <italic>Conclusion</italic>, summarizes the main contributions of this work.</p>
</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Database Structure</title>
      <p id="d2e442">To ensure ease of use, Wikimpacts 1.0 adopts impact categories similar to those used in existing disaster databases, such as EM-DAT. Table <xref ref-type="table" rid="T1"/> provides a detailed description of the information recorded in our database. We classify all events recorded in the database into 7 categories, hereafter referred to as Main Events, and subsequently assign one or more hazards to each main event category (see Table <xref ref-type="table" rid="T2"/>). Table <xref ref-type="table" rid="T3a"/> further details the technical specifications for all fields in our database. The database provides impact information at three levels: event level (L1), national level (L2), and sub-national level (L3). L1 provides the total impacts associated with a given main event across all affected countries; L2 provides the national-level impacts, and is the same as L1 if the event affected a single country; and L3 includes impacts at the smallest available sub-national locations within each affected country. The location-related information is summarized in Table <xref ref-type="table" rid="T1"/>. For L1 and L2, the locations are specified in Administrative_Areas_Norm, which contains a list of affected countries. For L3, the location information comprises both Administrative_Areas_Norm and Locations_Norm, indicating one affected country and a list of affected sub-locations such as provinces or cities. In the remainder of the text, we use the general term “location” or “locations” to refer to both these fields. This structure is exemplified in Fig. <xref ref-type="fig" rid="F1"/> for deaths caused by the severe flooding episode that affected parts of Western Europe in 2021. The L1 information is the total number of deaths across all countries affected by the event. L2 provides a breakdown of the number of deaths by country e.g., 196 deaths in Germany. L3 further details the number of deaths at a sub-national level, specifying either point locations (e.g., cities) or polygons (e.g., provinces). This is shown as an example for the city of Pepinster (point) and for the German state of Bavaria (polygon); the full deaths information for the 2021 European Floods can be found in Sect. S1 in the Supplement. In relation to the 2021 European flood event, the information on fatalities recorded in Wikipedia has been updated as of 2024 since it was accessed to construct the database and indicates 196 deaths in Germany, 39 in Belgium, 2 in Romania, and 1 each in Italy and Austria as of 2025 (information manually extracted on 15 January 2026).</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e458">List of the information included in the Wikimpacts 1.0 database and their definitions.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="3">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Information Type</oasis:entry>
         <oasis:entry colname="col2">Field</oasis:entry>
         <oasis:entry colname="col3">Definition</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Basic</oasis:entry>
         <oasis:entry colname="col2">Event_ID</oasis:entry>
         <oasis:entry colname="col3">Unique event identifier, consistent across levels L1–L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Basic</oasis:entry>
         <oasis:entry colname="col2">Sources</oasis:entry>
         <oasis:entry colname="col3">Original Wikipedia link(s) of the event.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Basic</oasis:entry>
         <oasis:entry colname="col2">Event_Names</oasis:entry>
         <oasis:entry colname="col3">Name(s) of the event.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Basic</oasis:entry>
         <oasis:entry colname="col2">Main_Event</oasis:entry>
         <oasis:entry colname="col3">Unique categorisation of the event at L1 (see Table <xref ref-type="table" rid="T2"/>).</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Basic</oasis:entry>
         <oasis:entry colname="col2">Hazards</oasis:entry>
         <oasis:entry colname="col3">Hazards associated with the Main_Event at L1, which refer to the potential occurrence of physical</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">phenomena that may cause impacts (see Table <xref ref-type="table" rid="T2"/>).</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Time-related</oasis:entry>
         <oasis:entry colname="col2">Start_Date_Day</oasis:entry>
         <oasis:entry colname="col3">Start day of the event at L1, or start day of the impact recorded at L2/L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Time-related</oasis:entry>
         <oasis:entry colname="col2">Start_Date_Month</oasis:entry>
         <oasis:entry colname="col3">Start month of the event at L1, or start month of the impacts recorded at L2/L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Time-related</oasis:entry>
         <oasis:entry colname="col2">Start_Date_Year</oasis:entry>
         <oasis:entry colname="col3">Start year of the event at L1, or start year of the impacts recorded at L2/L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Time-related</oasis:entry>
         <oasis:entry colname="col2">End_Date_Day</oasis:entry>
         <oasis:entry colname="col3">End day of the event at L1, or end day of the impacts recorded at L2/L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Time-related</oasis:entry>
         <oasis:entry colname="col2">End_Date_Month</oasis:entry>
         <oasis:entry colname="col3">End month of the event at L1, or end month of the impacts recorded at L2/L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Time-related</oasis:entry>
         <oasis:entry colname="col2">End_Date_Year</oasis:entry>
         <oasis:entry colname="col3">End year of the event at L1, or end year of the impacts recorded at L2/L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Areas_Norm</oasis:entry>
         <oasis:entry colname="col3">Affected countries from GADM at L1/L2.</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Areas_Type</oasis:entry>
         <oasis:entry colname="col3">Administrative types of affected countries from OpenStreetMap (OSM), United Nations Statistics</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">Division (UNSD), or Global Administrative Unit Layers (GAUL 2015) at L1/L2.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Areas_GeoJSON</oasis:entry>
         <oasis:entry colname="col3">GeoJSON format of the affected countries at L1/L2.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Areas_GID</oasis:entry>
         <oasis:entry colname="col3">GADM Global Administrative Areas IDs of the affected countries at L1/L2.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Area_Norm</oasis:entry>
         <oasis:entry colname="col3">Affected country at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Area_Type</oasis:entry>
         <oasis:entry colname="col3">Administrative type of affected country from OSM , UNSD, or GAUL 2015 at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Area_GeoJSON</oasis:entry>
         <oasis:entry colname="col3">GeoJSON format of the affected country at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Administrative_Area_GID</oasis:entry>
         <oasis:entry colname="col3">GADM Global Administrative Areas ID of the affected country at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Locations_Norm</oasis:entry>
         <oasis:entry colname="col3">Affected sub-national area names at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Locations_Type</oasis:entry>
         <oasis:entry colname="col3">Affected sub-national types from OSM at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Locations_GeoJson</oasis:entry>
         <oasis:entry colname="col3">GeoJSON format of the affected sub-national areas at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Location-related</oasis:entry>
         <oasis:entry colname="col2">Locations_GID</oasis:entry>
         <oasis:entry colname="col3">GADM Global Administrative Areas IDs of the affected sub-national areas at L3.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Deaths</oasis:entry>
         <oasis:entry colname="col3">The number of deaths in the event. Missing people are not included as deaths.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Injuries</oasis:entry>
         <oasis:entry colname="col3">The number of non-fatal injuries in the event.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Homeless</oasis:entry>
         <oasis:entry colname="col3">The number of people made homeless by the event.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Displaced</oasis:entry>
         <oasis:entry colname="col3">The number of people displaced by the event.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Affected</oasis:entry>
         <oasis:entry colname="col3">The number of people affected by the event.</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Buildings_Damaged</oasis:entry>
         <oasis:entry colname="col3">The number of buildings damaged by the event.</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Insured_Damage</oasis:entry>
         <oasis:entry colname="col3">Damage from physical harm or loss to property, assets, or individuals covered under an insurance</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">policy in the event.</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Impact-related</oasis:entry>
         <oasis:entry colname="col2">Damage</oasis:entry>
         <oasis:entry colname="col3">The economic damage caused by the event.</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

<table-wrap id="T2"><label>Table 2</label><caption><p id="d2e904">L1 Main event categories and associated hazards.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="2">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Main Event</oasis:entry>
         <oasis:entry colname="col2">Associated Hazard(s)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Flood</oasis:entry>
         <oasis:entry colname="col2">Flood</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Extratropical Storm/Cyclone</oasis:entry>
         <oasis:entry colname="col2">Wind, Flood, Blizzard, Hail</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tropical Storm/Cyclone</oasis:entry>
         <oasis:entry colname="col2">Wind, Flood, Lightning</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Extreme Temperature</oasis:entry>
         <oasis:entry colname="col2">Heatwave, Cold Spell</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Drought</oasis:entry>
         <oasis:entry colname="col2">Drought</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Wildfire</oasis:entry>
         <oasis:entry colname="col2">Wildfire</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tornado</oasis:entry>
         <oasis:entry colname="col2">Wind</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <fig id="F1"><label>Figure 1</label><caption><p id="d2e998">A simplified representation of deaths caused by the 2021 European Floods as reported in the Wikimpacts 1.0 database. For this flood event, the database includes information at L1 (event level): Total deaths in the 2021 European Floods, L2 (national level): 196 deaths in Germany, L3 (sub-national level, polygon): 2 deaths in the state of Bavaria, and L3 (sub-national level, point): 23 deaths in the city of Pepinster. This is only a subset of the full information provided in the database for this event.</p></caption>
        <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f01.png"/>

      </fig>

      <p id="d2e1007">The Wikimpacts 1.0 database is stored in a relational format (Fig. <xref ref-type="fig" rid="F2"/>). As shown in Fig. <xref ref-type="fig" rid="F2"/>, the database permits only a single entry at the L1 level. Each L1 entry is associated with zero or more L2 and L3 entries. Each L2 entry can in turn be linked to zero or multiple L3 entries. If there are L3 entries, all L3 impacts within the same country are aggregated into a single L2 entry. There is no direct linkage between the L2 and L3 entries in the database; however, comparing the “Administrative_Area_GID” from the L3 entry with the “Administrative_Areas_GID” in the L2 entry enables identifying the corresponding entries. For all three levels, we provide a detailed breakdown of the schema, structure, and permitted values as follows: (i) Field: the specific names assigned to each piece of information within the schema; (ii) Data Type: the data format for each field (integer, string, list, boolean); (iii) Permitted Values: the range or set of allowed values for each field (e.g., specific categories, numeric ranges); (iv) Mandatory: an indication of whether the field is required (e.g. Yes/No). All main events must include L1 information, while L2 and L3 are optional and included only when relevant information is available in the corresponding Wikipedia article.</p>

      <fig id="F2" specific-use="star"><label>Figure 2</label><caption><p id="d2e1016">Wikimpacts 1.0 database structure. L1 records the complete event metadata, including the basic information. L2 and L3 store only location-, time-, and impact-related fields. Entries across L1–L3 are grouped by a shared Event_ID, but L2 and L3 entries are not directly linked and require additional administrative-area matching, with one L1 event potentially linked to multiple L2 entries, and one L2 entry potentially linked to multiple L3 entries (1:N). For further details on the information fields in the figure see Table <xref ref-type="table" rid="T1"/>.</p></caption>
        <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f02.png"/>

      </fig>

<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Event Level (L1)</title>
      <p id="d2e1034">L1 includes both direct impacts (Deaths, Injuries, Homeless, Displaced, Affected, and Buildings Damaged) and monetary impacts (Damage and Insured Damage). All impact fields are nullable, but at least one impact must be present to report the event in our database. Basic information fields about the event, such as Event_ID, Event_Names, Sources, Start_Date_Year, and Administrative_Areas_Norm are mandatory at this level. We use the Database of Global Administrative Areas (GADM) level 0 administrative area to denote the Administrative_Areas_Norm field in our database <xref ref-type="bibr" rid="bib1.bibx16" id="paren.24"/>. This area representation may contain countries or other geographic entities, which we hereafter refer to as either a country or as a national-level location. We remain neutral regarding to jurisdictional claims made in any material presented in this paper and the associated database. The impact information refers to the event's overall impact (e.g. 243 deaths in Fig. <xref ref-type="fig" rid="F1"/>). Whenever possible, impact information from Wikipedia articles is sourced from parts of the text which explicitly state the total impact. If aggregated impacts for the main event are not explicitly stated in the article, we aggregate data from L2 to present the total impact in L1. Fields with names ending in “Approx” indicate whether the information extracted from the Wikipedia article is precise (Table <xref ref-type="table" rid="T3a"/>). Returning to our example of the 2021 European floods, the article specifies “243 deaths”, and the “Approx” field for this number in the database is thus marked as “False”. Conversely, if the article had stated “more than 200 deaths”, then the data would have been normalized to <inline-formula><mml:math id="M1" display="inline"><mml:mrow><mml:mo>[</mml:mo><mml:mn mathvariant="normal">201</mml:mn><mml:mo>,</mml:mo><mml:mn mathvariant="normal">301</mml:mn><mml:mo>]</mml:mo></mml:mrow></mml:math></inline-formula> in the database using predefined normalization rules (see Sect. S7), and the related “Approx” field would have been marked as “True”. Similarly, if the L1 impact information is inferred from L2, the related “Approx” field is also marked as “True”.</p>

<table-wrap id="T3a" specific-use="star"><label>Table 3</label><caption><p id="d2e1063">List of information fields in the Wikimpacts 1.0 database, their properties and the relevant database levels. DIRECT IMPACT includes deaths, injuries, displaced, homeless, affected and buildings damaged; MONETARY IMPACT includes damage and insured damage.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Field</oasis:entry>
         <oasis:entry colname="col2">Data type</oasis:entry>
         <oasis:entry colname="col3">Permitted values</oasis:entry>
         <oasis:entry colname="col4">Mandatory</oasis:entry>
         <oasis:entry colname="col5">Applied</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5">level(s)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Event_ID</oasis:entry>
         <oasis:entry colname="col2">UUID</oasis:entry>
         <oasis:entry colname="col3">Short uuid, 7 characters</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Hazards</oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">String(s) from Table <xref ref-type="table" rid="T2"/></oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Main_Event</oasis:entry>
         <oasis:entry colname="col2">String</oasis:entry>
         <oasis:entry colname="col3">String from Table <xref ref-type="table" rid="T2"/></oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Event_Names</oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">String(s)</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Sources</oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">Valid URL(s)</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Areas_Norm</oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">National-level administrative area</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1, L2</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">names from OSM or UNSD</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Areas_Type<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">National-level administrative area types</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1, L2</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">from OSM, UNSD, or GAUL 2015</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Areas_GID<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">National-level administrative area</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1, L2</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">GIDs from GADM</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Areas_GeoJson<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">List[JSON]</oasis:entry>
         <oasis:entry colname="col3">National-level administrative area</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1, L2</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">GeoJSON objects from OSM</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Area_Norm</oasis:entry>
         <oasis:entry colname="col2">String</oasis:entry>
         <oasis:entry colname="col3">The national-level administrative</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">area name from OSM or UNSD</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Area_Type<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">String</oasis:entry>
         <oasis:entry colname="col3">The national-level administrative area</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">type from OSM, UNSD or GAUL 2015</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Area_GID<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">String</oasis:entry>
         <oasis:entry colname="col3">The national-level administrative</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">area GID from GADM</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Area_GeoJson<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">JSON</oasis:entry>
         <oasis:entry colname="col3">The national-level administrative area/division</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">GeoJSON objects from OSM</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Locations_Norm</oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">Area names within the specified</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">national-level administrative area</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Locations_Type<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">Area types (from OSM) within the specified</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">national-level administrative area</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Locations_GID<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">List[String]</oasis:entry>
         <oasis:entry colname="col3">Area GADM GIDs within the specified</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">national-level administrative area</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Locations_GeoJson <sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">List[JSON]</oasis:entry>
         <oasis:entry colname="col3">GeoJSON objects within the specified</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3">national-level administrative area</oasis:entry>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Start_Date_Day</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1–31</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Start_Date_Month</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1–12</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Start_Date_Year</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1034–2024</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">End_Date_Day</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1–31</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">End_Date_Month</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1–12</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">End_Date_Year</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1034–2024</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1, L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_DIRECT_IMPACT_Min</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">0–inf</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_DIRECT_IMPACT_Max</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">0–inf</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_DIRECT_IMPACT_Approx<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">Boolean</oasis:entry>
         <oasis:entry colname="col3">True, False</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_MONETARY_IMPACT_Min</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">0–inf</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_MONETARY_IMPACT_Max</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">0–inf</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

<table-wrap id="T3b" specific-use="star"><label>Table 3</label><caption><p id="d2e1882">Continued.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Field</oasis:entry>
         <oasis:entry colname="col2">Data type</oasis:entry>
         <oasis:entry colname="col3">Permitted values</oasis:entry>
         <oasis:entry colname="col4">Mandatory</oasis:entry>
         <oasis:entry colname="col5">Applied</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5">level(s)</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_MONETARY_IMPACT Approx<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">Boolean</oasis:entry>
         <oasis:entry colname="col3">True, False</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_MONETARY_IMPACT_Unit</oasis:entry>
         <oasis:entry colname="col2">String</oasis:entry>
         <oasis:entry colname="col3">ISO 4217 currency</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_MONETARY_IMPACT Inflation_Adjusted</oasis:entry>
         <oasis:entry colname="col2">Boolean</oasis:entry>
         <oasis:entry colname="col3">True, False</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_MONETARY_IMPACT Inflation_Adjusted_Year</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1034–2024</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L1</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Num_Min</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">0–inf</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Num_Max</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">0–inf</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Num_Approx<sup>*</sup></oasis:entry>
         <oasis:entry colname="col2">Boolean</oasis:entry>
         <oasis:entry colname="col3">True, False</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Num_Unit</oasis:entry>
         <oasis:entry colname="col2">String</oasis:entry>
         <oasis:entry colname="col3">ISO 4217 currency code</oasis:entry>
         <oasis:entry colname="col4">Yes</oasis:entry>
         <oasis:entry colname="col5">L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Num_Inflation_Adjusted</oasis:entry>
         <oasis:entry colname="col2">Boolean</oasis:entry>
         <oasis:entry colname="col3">True, False</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L2, L3</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Inflation_Adjusted_Year</oasis:entry>
         <oasis:entry colname="col2">Non-negative integer</oasis:entry>
         <oasis:entry colname="col3">1034–2024</oasis:entry>
         <oasis:entry colname="col4">No</oasis:entry>
         <oasis:entry colname="col5">L2, L3</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e1885"><sup>*</sup> Fields that are not included in the database evaluation process.</p></table-wrap-foot></table-wrap>

</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>National Level (L2)</title>
      <p id="d2e2155">L2 breaks down the impact information at national level. The Administrative_Areas_Norm field is a list, typically containing the single country (17 802 entries in the database) in which the reported total impact occurred or, in rare cases, a list of countries (110 entries in the database) if the impact could not be fully disaggregated between a subset of countries. Figure <xref ref-type="fig" rid="F1"/> provides as example the total number of deaths in Germany during the 2021 European Floods, and Sect. S1 shows that L2 contains corresponding information for other countries affected by these floods. Spatial information on the L2 impacts is mandatory in order for them to be included in the database, while temporal information is not mandatory as the impact should logically fall within the time span specified in L1 (Table <xref ref-type="table" rid="T3a"/>). National-level impact information is not always available. In some cases, the overall impact at this level is unknown, but impact information for specific locations within a country is provided. In these cases, we aggregate the information from L3 to present it in L2.</p>
</sec>
<sec id="Ch1.S2.SS3">
  <label>2.3</label><title>Sub-national Level (L3)</title>
      <p id="d2e2171">L3 provides a detailed breakdown of impact information at a sub-national level (e.g., province, municipality) <xref ref-type="bibr" rid="bib1.bibx16 bib1.bibx34" id="paren.25"/>. Similarly to L1, we use the GADM level 0 administrative area to denote the Administrative_Area_Norm fields in this level. Figure <xref ref-type="fig" rid="F1"/> provides as example the information on number of deaths in L3 for the city of Pepinster (shown as a point) in Belgium and the state of Bavaria (shown as a polygon) in Germany. In most cases, the impact is confined to a single location, yet there are instances where the impact spans multiple places within the country. In that case, the field Administrative_Area_Norm contains the country, and the field Locations_Norm contains a list of specific locations within that country where the impact occurred. Like for L2, spatial information is mandatory at this level, while temporal information remains optional (Table <xref ref-type="table" rid="T3a"/>).</p>
</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Wikimpacts Processing Pipeline</title>
      <p id="d2e2191">The Wikimpacts processing pipeline comprises four modules (Fig. <xref ref-type="fig" rid="F3"/>). First, we select relevant articles for processing. Next, we apply a list of prompts to extract the necessary information. After extraction, we post-process the raw output to represent the data in standardized formats. Finally, we check for data consistency across the three levels, address missing information, convert currencies, adjust inflation, and format the database for ease of use. Each module is described in detail below.</p>

      <fig id="F3"><label>Figure 3</label><caption><p id="d2e2198">Full pipeline of the Wikimpacts 1.0 database construction (Icons by Icons8 provided under a free license at <uri>https://icons8.com/</uri>, last access: 20 May 2026).</p></caption>
        <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f03.png"/>

      </fig>

<sec id="Ch1.S3.SS1">
  <label>3.1</label><title>Document Selection</title>
      <p id="d2e2217">A three-step approach is used to select relevant English articles. First, we craft a keyword list covering all main event categories in the database, which we then use to extract relevant articles (see Sect. S2 for keywords). Querying Wikipedia using these English keywords (with a cut-off date at 29 February 2024), results in 30 085 articles. However, not all articles retrieved through this keyword extraction process are related to climate events. For instance, some refer to topics like “Miami Hurricanes football” <xref ref-type="bibr" rid="bib1.bibx66" id="paren.26"/>. Therefore, in a second step, to filter non-climate-related articles automatically, we apply as text classifier a pre-trained English distilled Bidirectional Encoder Representations from Transformers (BERT) model (DistilBert for sequence classification, accessed via the HuggingFace platform at <uri>https://huggingface.co/docs/transformers/en/model_doc/distilbert</uri>,  last access: 20 May 2026) <xref ref-type="bibr" rid="bib1.bibx12 bib1.bibx41" id="paren.27"/>). To this end, the BERT model is fine-tuned on a set of 300 Wikipedia articles, containing 248 relevant and 52 irrelevant articles.<fn id="Ch1.Footn1"><p id="d2e2229">For articles longer than 512 tokens, only the first 512 tokens are used.</p></fn> Using 150 articles for training, 100 articles for validation, and 50 articles for testing (with the relevance distribution shown in Table <xref ref-type="table" rid="T4"/>), we obtain an F1-score of 98.8 on the test set (with a precision score of 97.7 and a perfect recall score of 100.0; see Sect. S3 for definitions of F1-score, precision, and recall). From the original 30 085 articles, we classify 4900 as relevant in this second step. Thirdly, we manually check all these classified articles to confirm their relevance. We identify 184 false positives in the set of 4900 articles and another 330 false negatives in the remaining 25 185 articles. In the end, we identify 5046 English Wikipedia articles as relevant for further processing.</p>

<table-wrap id="T4"><label>Table 4</label><caption><p id="d2e2238">Article relevance distribution for the 300 English Wikipedia articles used to fine-tune the BERT model for text classification.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="3">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Data Set</oasis:entry>
         <oasis:entry colname="col2">Relevant</oasis:entry>
         <oasis:entry colname="col3">Irrelevant</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Training Data</oasis:entry>
         <oasis:entry colname="col2">128</oasis:entry>
         <oasis:entry colname="col3">22</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Validation Data</oasis:entry>
         <oasis:entry colname="col2">78</oasis:entry>
         <oasis:entry colname="col3">22</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Test Data</oasis:entry>
         <oasis:entry colname="col2">42</oasis:entry>
         <oasis:entry colname="col3">8</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e2306">It should be highlighted that some Wikipedia articles describe only one event, e.g., Hurricane Ida <xref ref-type="bibr" rid="bib1.bibx65" id="paren.28"/>, while other articles cover a series of events, such as the 2021 Atlantic hurricane season <xref ref-type="bibr" rid="bib1.bibx67" id="paren.29"/>. We refer to the former as the “single-event articles” and to the latter as “multi-event articles”. Multi-event articles present specific challenges. For some events, they serve as the sole source of information on Wikipedia, while for others, there exist dedicated “single-event articles” that provide more detailed information and should be used as the basis for those events. Moreover, the structure of multi-event articles differs significantly from that of single-event articles due to the number of events they cover, requiring a further processing step. To address this, we post-process the 5,046 articles to identify single- and multi-event articles. Using the GPT4o Mini model (version: gpt-4o-mini-2024-07-18), we extract relevant climatic events from the full set of 5046 Wikipedia articles. This yields 6625 events. We then conduct the reverse process, and search Wikipedia to locate the relevant articles for those events. In total, we identify 3368 events mapped to a unique Wikipedia article. The remaining 3257 events are linked to Wikipedia articles already identified as sources for at least one other climate event, suggesting that those articles are multi-event articles. Moreover, within the 3368 events mapped to a unique, we identify 222 cases of multi-event article entries. To detect these misclassified multi-event articles, we perform a keyword search using [“list”, “season”, “cyclones”, “hurricanes”, “typhoons”, “tornadoes”]. This procedure yields 212 entries containing the keyword “season” (e.g., 1939 Pacific hurricane season; <xref ref-type="bibr" rid="bib1.bibx51" id="altparen.30"/>), 5 entries containing the keyword “cyclones” (e.g., Tropical cyclones in 2013; <xref ref-type="bibr" rid="bib1.bibx62" id="altparen.31"/>), 1 entry containing the keyword “list” (e.g., Lists of tornadoes and tornado outbreaks; <xref ref-type="bibr" rid="bib1.bibx69" id="altparen.32"/>), 2 entries each containing the keyword “hurricanes” and “typhoons” respectively (e.g., Hurricanes in Nicaragua and Typhoons in Taiwan; <xref ref-type="bibr" rid="bib1.bibx58 bib1.bibx61" id="altparen.33"/>). For the keyword “tornadoes”, we treat tornado outbreaks as a single event (e.g. the “2017 Tulsa tornadoes” article; <xref ref-type="bibr" rid="bib1.bibx54" id="altparen.34"/>). For other major event types, such as floods and wildfires, we do not remove articles with plural titles (e.g., 2021 European floods; <xref ref-type="bibr" rid="bib1.bibx64" id="altparen.35"/>, 2015 Russian wildfires; <xref ref-type="bibr" rid="bib1.bibx53" id="altparen.36"/>), because these articles do not provide information for multiple individual flood or wildfire events. This filtering procedure ensures that the Wikimpacts 1.0 database is restricted to single-event articles and mitigates duplication arising from multi-event entries. The risk of duplicated information within single-event articles is expected to be relatively low, and we plan to verify this more systematically in future updates of the database. Notably, for hazard types beyond tropical cyclones, our event unit follows the Wikipedia single-event article. When a single-event article describes multiple related episodes (e.g., impacts in several countries, or multiple phases within the same system), we represent the content as one aggregated event record rather than attempting to delineate event boundaries. For example, the “2021 European floods” are stored as one event, with impacts accessible separately for each affected country via L2. In the remainder of the paper, we focus exclusively on those 3146 events mapped to a single-event article to construct the Wikimpacts 1.0 database.</p>
</sec>
<sec id="Ch1.S3.SS2">
  <label>3.2</label><title>Information Extraction Using GPT4o Model</title>
      <p id="d2e2346">A core component of our database construction pipeline is the application of the GPT4o model (version: gpt-4o-2024-05-13). Different from initial trials <xref ref-type="bibr" rid="bib1.bibx24" id="paren.37"/>, we employ the GPT4o model, released in 2024, rather than the GPT4 model because its longer context window <xref ref-type="bibr" rid="bib1.bibx33" id="paren.38"/> allows it to process a substantially larger number of input tokens, which is particularly beneficial for handling long Wikipedia articles. To extract information from Wikipedia articles, we feed the full text and the information box (if it exists) to the GPT4o model together with a set of prompts corresponding to the different fields of our database. We do not process tables or list items within them. Consequently, information that appears only in tables is currently excluded from the database. To facilitate post-processing, we instruct the GPT4o model to provide output in JSON. However, one issue we faced was that the model sometimes cannot produce valid JSON objects. This can occur due to the longer output length that exceeds the total number of permitted output tokens, as found by <xref ref-type="bibr" rid="bib1.bibx24" id="text.39"/> – for example when we instruct the model to return the text segment where it identifies the relevant information as a traceable source in the output but this is too long for JSON output. To mitigate this issue, each Wikipedia article is presented as a JSON file where each key is the header title of the  section in the Wikipedia article and each value is the verbatim text as it appears in Wikipedia. Compared to other text sources, Wikipedia articles are well-structured, enabling the extraction of the full text in the header-content pair format. In this setup, and for all fields, we instruct the model to provide a source section that includes the original section headers from the Wikipedia article where the information is found. This strategy also helps to prevent model hallucinations <xref ref-type="bibr" rid="bib1.bibx48" id="paren.40"/> since the model does not need to return large blocks of source text when extracting information on extreme climate impacts.</p>
      <p id="d2e2361">To obtain location and time information about the event in L1, we build prompts for the relevant information, and for the source section of this information. To obtain the location information, we ask the model to capture all locations affected by the event and retrieve the affected countries during post-processing. To obtain the main event category and the reported hazards, we provide the model with the list of main event categories and the hazards associated with each category (Table <xref ref-type="table" rid="T2"/>). Following this, we pose four prompts: the first for the event category, the second for the source section of the event category, the third for the associated hazards based on the result of the event category, and the last for the source section of the hazards. We then use more complex prompts to extract information on different impacts. These prompts partly rely on keywords used for categorising the impacts. These same keywords are also used in the annotation process (Sect. <xref ref-type="sec" rid="Ch1.S4.SS1"/>). The L1 information represents the total impact of the event, for which we use two prompts: one regarding the total impact and another pertaining to its source section. This is followed by information extraction at L2 and L3, as well as specifics on times and locations, if such details are available. Additionally, we prompt the model to capture L1 impact information only when explicitly stated in the text, such as in the 2021 European Floods example: “At least 243 people died in the floods”. If this information is not provided explicitly, the model is tasked to return “NULL” rather than summing individual data entries to produce a total for L1. Similarly, for L2, the model is tasked to return the total impact for specific countries only when explicitly available. If unavailable, it should not aggregate data from various locations within a country but instead return “NULL”. We also evaluate the performance of different prompt settings for information extraction. Our prompt design, evaluation and the complete text of the prompts used for full run production can be found in Sect. S4. We use what is termed “prompt v3.1” in the Supplement for all information categories, except the L1 location, where we use “prompt v3.2”.</p>
</sec>
<sec id="Ch1.S3.SS3">
  <label>3.3</label><title>Post-Processing</title>
      <p id="d2e2376">The outputs produced by the GPT4o model contain “raw” data (e.g. dates represented in a variety of formats or ambiguous location names) that often requires normalization i.e., conversion to a standardized format. We apply a set of normalization rules (see Sect. S7) to the raw data, ensuring that the post-processed model output can be evaluated and stored in a standardized format in the database. Overall, we normalise the main event, hazards, time, location, and numerical data prior to the evaluation. The detailed post-processing steps are listed below.</p>
<sec id="Ch1.S3.SS3.SSS1">
  <label>3.3.1</label><title>Main Event and Hazards</title>
      <p id="d2e2386">The model is prompted to identify the unique Main Event of each article, and the goal of the normalization is to validate that the model extracts a single Main Event belonging to one of the categorical variables, and that all extracted hazards are associated with that particular Main Event category (see Table <xref ref-type="table" rid="T2"/>). In case of multiple relevant Hazards, we prompt the model to split them with “<inline-formula><mml:math id="M15" display="inline"><mml:mo>|</mml:mo></mml:math></inline-formula>”, and in the normalization process, we convert this to a list.</p>
</sec>
<sec id="Ch1.S3.SS3.SSS2">
  <label>3.3.2</label><title>Time and Location</title>
      <p id="d2e2406">Dates extracted by the LLM appear in various locales or formats with some components missing (for example, the month and year may be known but not the day). Dates in their different locales, whether partial or complete, are standardized using <monospace>dateparser</monospace> <xref ref-type="bibr" rid="bib1.bibx5" id="paren.41"/> in Python.</p>
      <p id="d2e2415">The model is prompted to identify locations at different administrative levels (such as countries, cities, or provinces) for the three database levels (L1, L2, and L3). In prompt v3.2, the model is prompted to identify a list of countries affected by the main event in question, thus providing L1 information. In prompt v3.1, for L2, the model is prompted to produce a list of national-level locations where an impact could be quantified. For L3, the model is prompted to identify a single administrative area at the national level and to capture smaller administrative areas associated with the impact within that country. The normalization pipeline tries to disambiguate these locations using the Nominatim API Manual (<uri>https://nominatim.org/release-docs/develop/api/Overview/</uri>, last access: 20 May 2026) to search for locations on OpenStreetMap <xref ref-type="bibr" rid="bib1.bibx34" id="paren.42"/>, an open geographical database.</p>
      <p id="d2e2424">Location names are extracted verbatim from the article by the LLM, making the output prone to contain locations expressed in various spelling conventions or colloquial names. Often, the retrieved text may refer to locations that are under dispute or not recognized internationally. To mitigate this, we normalize all locations so that they fit within a single standard representation. The standard format for a normalized location is split over 4 fields representing: <list list-type="custom"><list-item><label>1.</label>
      <p id="d2e2429">the location's official English name (<monospace>_Norm</monospace>) whenever  available;</p></list-item><list-item><label>2.</label>
      <p id="d2e2436">the administrative address level or type (<monospace>_Type</monospace>) as defined by OpenStreetMap and returned in the Nominatim API raw output as defined by <xref ref-type="bibr" rid="bib1.bibx35" id="text.43"/>, or GAUL 2015 Admin 1 (<uri>https://data.apps.fao.org/catalog/dataset/gaul-code-list-global-admin-1</uri>, last access: 20 May 2026);</p></list-item><list-item><label>3.</label>
      <p id="d2e2449">the GADM GID (<monospace>_GID</monospace>) <xref ref-type="bibr" rid="bib1.bibx16" id="paren.44"/><fn id="Ch1.Footn2"><p id="d2e2457">Not all locations can be normalized to a GID given the limited level depth of GADM which may not represent small towns or may not group larger unofficial or disputed regions.</p></fn>; and</p></list-item><list-item><label>4.</label>
      <p id="d2e2462">a GeoJson object (<monospace>_GeoJson</monospace>) to visually represent the area on a map with a valid GeoJson type (such as <monospace>Polygon</monospace>). In Wikimpacts 1.0 database, GADM 4.1 version is used.</p></list-item></list></p>
      <p id="d2e2471">Location and region names are disambiguated using OpenStreetMap <xref ref-type="bibr" rid="bib1.bibx34" id="paren.45"/> and the UNSD M49 dataset (UNSD M49, UN, <uri>https://unstats.un.org/unsd/methodology/m49/</uri>, last access: 20 May 2026). When extracting GeoJson objects from OpenStreetMap, GeoJson shapes other than <monospace>Point</monospace> are preferred whenever available, but the pipeline falls back to <monospace>Point</monospace> if nothing else is available.</p>
</sec>
<sec id="Ch1.S3.SS3.SSS3">
  <label>3.3.3</label><title>Numerical Data</title>
      <p id="d2e2494">Often, LLM output extracts numerical information with phrasing that renders it open to interpretation (e.g., “No less than 12 people were injured” or “Billions of dollars were paid in damages”). It may also extract single numbers expressed in different locales dictating whether decimals use periods or commas. The normalization process aims to transform such expressions into quantifiable and standardized formats. Normalized numbers are represented in a range spread over three columns:  <inline-formula><mml:math id="M16" display="inline"><mml:mrow><mml:mo>〈</mml:mo><mml:mtext mathvariant="italic">min</mml:mtext><mml:mo>,</mml:mo><mml:mtext mathvariant="italic">max</mml:mtext><mml:mo>,</mml:mo><mml:mtext mathvariant="monospace">approximation</mml:mtext><mml:mo>〉</mml:mo></mml:mrow></mml:math></inline-formula> where “approximation” is a boolean representing whether the information is an exact number or an approximation of the exact number.</p>
      <p id="d2e2517">In short, the normalization process for numbers automatically checks if an immediate conversion of the expression to a number or range is possible (e.g., “1421” or “20–30” can quickly be converted to <inline-formula><mml:math id="M17" display="inline"><mml:mrow><mml:mo>〈</mml:mo><mml:mn mathvariant="normal">1421</mml:mn><mml:mo>,</mml:mo><mml:mn mathvariant="normal">1421</mml:mn><mml:mo>,</mml:mo><mml:mtext mathvariant="monospace">False</mml:mtext><mml:mo>〉</mml:mo></mml:mrow></mml:math></inline-formula> or <inline-formula><mml:math id="M18" display="inline"><mml:mrow><mml:mo>〈</mml:mo><mml:mn mathvariant="normal">20</mml:mn><mml:mo>,</mml:mo><mml:mn mathvariant="normal">30</mml:mn><mml:mo>,</mml:mo><mml:mtext mathvariant="monospace">True</mml:mtext><mml:mo>〉</mml:mo></mml:mrow></mml:math></inline-formula>). If not, the normalization script checks for any quantifiers such as “tens of thousands of homes were destroyed” or “No less than 20 deaths” and converts them into a range (the two previously mentioned examples would be normalized to <inline-formula><mml:math id="M19" display="inline"><mml:mrow><mml:mo>〈</mml:mo><mml:mn mathvariant="normal">20</mml:mn><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">000</mml:mn><mml:mo>,</mml:mo><mml:mn mathvariant="normal">90</mml:mn><mml:mspace width="0.125em" linebreak="nobreak"/><mml:mn mathvariant="normal">000</mml:mn><mml:mo>,</mml:mo><mml:mtext mathvariant="monospace">True</mml:mtext><mml:mo>〉</mml:mo></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M20" display="inline"><mml:mrow><mml:mo>〈</mml:mo><mml:mn mathvariant="normal">20</mml:mn><mml:mo>,</mml:mo><mml:mn mathvariant="normal">30</mml:mn><mml:mo>,</mml:mo><mml:mtext mathvariant="monospace">True</mml:mtext><mml:mo>〉</mml:mo></mml:mrow></mml:math></inline-formula>. A list of synonyms is used to determine whether or not a number is an approximation. This rule-based approach also employs part-of-speech tags and entities identified by SpaCy's English transformer pipeline model (SpaCy Manual, <uri>https://spacy.io/</uri>, last access: 20 May 2026), to extract min and max values for more complex expressions. The rules we applied in this step for normalizing different expressions into ranges are described in detail in Sect. S7.</p>
</sec>
</sec>
<sec id="Ch1.S3.SS4">
  <label>3.4</label><title>Database Consolidation</title>
      <p id="d2e2618">During the consolidation process, we filter out events that do not fall within our predefined main event types or hazard categories, such as “geomagnetic storm”, or “landslide”. Nonetheless, these events may be implicitly accounted for in the impact data, for example if the reported impacts for a flood include the impacts of a landslide triggered by the flood. Upon constructing the initial database, we identify missing information at various levels. For instance, the attribute Total_Deaths for a particular event might be recorded as NULL at L1, while at L2, there could be an entry indicating 20 fatalities in Germany. Furthermore, the cumulative impact at L3 within a single country might exceed the documented impact at L2 for the same country, and similarly, aggregated L2 data might provide larger values than the information available at L1.</p>
      <p id="d2e2621">To address these discrepancies and ensure data consistency across the database, we adopt a bottom-up approach beginning with L3. We sum L3 impact values for a given country and compare these to L2. If L2 provides a range, we adjust the minimum and maximum of the range if necessary. If L2 provides a single number, we transform this into a range if it is lower than the aggregated information from L3. We repeat the same procedure for L1, by aggregating impact values from L2. Detailed rules and procedures are provided in Sect. S8.</p>
      <p id="d2e2624">In addition to addressing these data inconsistencies, we standardize currencies and adjust for inflation throughout the database, choosing USD as the base currency. Using the currency statistics from the Wikimpacts 1.0 database, we obtain conversion rates for most non-USD currencies from a publicly available resource <xref ref-type="bibr" rid="bib1.bibx2" id="paren.46"/>. For periods before a currency's available data, a constant currency conversion rate is applied as the earliest available year. Additionally, we include EUR as a secondary standardized currency, with USD-2024-inflation-adjusted values converted to EUR using the 2024 average conversion rate.</p>
      <p id="d2e2630">Our approach to inflation adjustments follows the same rules as those documented by EM-DAT (Minneapolis Fed CPI calculator, <uri>https://www.minneapolisfed.org/about-us/monetary-policy/inflation-calculator/consumer-price-index-1800-</uri>, last access: 20 May 2026; EM-DAT protocol, <uri>https://doc.emdat.be/docs/protocols/economic-adjustment/</uri>, last access: 20 May 2026). In Wikimpacts 1.0, all monetary values are adjusted to reflect 2024's inflation rates, except for events occurring in 2024, which are left unadjusted for inflation. Detailed information on these adjustments is provided in Sect. S8.</p>
</sec>
</sec>
<sec id="Ch1.S4">
  <label>4</label><title>Evaluation of the Pipeline</title>
<sec id="Ch1.S4.SS1">
  <label>4.1</label><title>Data Annotation</title>
      <p id="d2e2656">As part of Wikimpacts 1.0, we develop a gold standard dataset by manually annotating Wikipedia articles. The gold standard events are randomly sampled from the original set of 5046 classified articles, and only the subset of single-event articles are annotated for Wikimpacts 1.0 database development, with the constraint that their event-type distribution is representative of that of the entire database. The annotation was conducted over the course of one year by two postdoctoral researchers in climate science and two researchers with a master's degree in water engineering. This gold standard dataset includes a development set containing 70 main events (used to develop the information extraction pipeline) and a test set containing 156 main events (used exclusively for evaluation of the GPT4o model output). The disaster type distribution of these two sets is shown in Sect. S5 and Table S6 in the Supplement. Compared to preliminary results from <xref ref-type="bibr" rid="bib1.bibx24" id="text.47"/>, part of these annotated data now include L2 and L3 information. In the development set, we have 55 events with L2 and L3 information annotated, while in the test set, there are 97 events annotated with this additional level of impact information. An error rate for each field provided by the GPT4o model is calculated by comparing the LLM output with the gold standard.</p>
      <p id="d2e2662">We recognise that manual annotation is not error-proof. To ensure consistent and robust annotation, we provided the annotators with a list of keywords for detecting impacts (see Table <xref ref-type="table" rid="T5"/>). We further established comprehensive logical normalization rules for the annotators to follow. These correspond to the post-processing rules for the Wikimpacts database (see Sect. S7).</p>

<table-wrap id="T5" specific-use="star"><label>Table 5</label><caption><p id="d2e2670">Keywords used for identifying impact fields in the annotation process of the Wikimpacts 1.0 database and in some of the prompts (see Sect. S4).</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="2">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Variable</oasis:entry>
         <oasis:entry colname="col2">Keywords</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Deaths</oasis:entry>
         <oasis:entry colname="col2">die, dead, killed, fatality, lost lives, perished, passed away</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Injuries</oasis:entry>
         <oasis:entry colname="col2">injured, hurt, wound, hospitalized</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Homeless</oasis:entry>
         <oasis:entry colname="col2">lost home, homeless, household damage, household destroy, house damage, home destroy, unhoused,</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">without shelter, houseless, shelterless</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Displaced</oasis:entry>
         <oasis:entry colname="col2">evacuated, displace, transfer/move to shelter, relocated, flee</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Affected</oasis:entry>
         <oasis:entry colname="col2">affect, impact, influence</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Buildings_Damaged</oasis:entry>
         <oasis:entry colname="col2">home, house, household, building, apartment, apartment block, school, church, office buildings, retail stores,</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">hotels, hospitals, dwellings, structures</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Insured_Damage</oasis:entry>
         <oasis:entry colname="col2">insurance, insured</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Damage</oasis:entry>
         <oasis:entry colname="col2">damage, economic, economy</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

<sec id="Ch1.S4.SS1.SSSx1" specific-use="unnumbered">
  <title>Internal Annotation Agreement Evaluation</title>
      <p id="d2e2792">The quality of our gold data is assessed using 10 articles annotated independently by two different annotators. One annotator provided annotations without explicitly classifying information as L2 or L3, and we inferred the L2 and L3 levels based on location information annotated at either the national or sub-national level. The second annotator explicitly defined L2 and L3 information for the same articles.</p>
      <p id="d2e2795">For L1, both annotators extract identical information, resulting in error rates of “0” across all fields, as shown in Sect. S5, Table S7. However, in the L2 and L3 evaluations, some discrepancy between the two annotators is apparent. These discrepancies depend on differences in the number of annotated entries, resulting from the two annotators interpreting the text differently (see Sect. S5, Tables S8 and S9). For L2 annotations, some cases involved one annotator transferring information from L3 into L2. For instance, in the event “Typhoon Talim (2017)” <xref ref-type="bibr" rid="bib1.bibx68" id="paren.48"/>, the text under the subsection on impacts in Japan states: “On Saiki City and Tsukumi City in Oita Prefecture, some residents were trapped in their houses due to flash floods, which were immediately rescued by the authorities. Five homes were entirely destroyed, 615 were partially destroyed, and 804 were partially damaged, according to reports”, one annotator created 3 L2 entries for buidlings damaged in Japan, although this should have been recorded as an L3 entry. For L3 entries, discrepancies emerge for example from different subjective choices on which locations to retain. For instance, in the event “Cyclone Vayu” <xref ref-type="bibr" rid="bib1.bibx59" id="paren.49"/>, one annotator created an L3 entry with “Locations” as “Ullal&amp;India<inline-formula><mml:math id="M21" display="inline"><mml:mo>|</mml:mo></mml:math></inline-formula>Gujarat&amp;India” and “Buildings Damaged” as “15”, while the other annotator recorded the same event with “Locations” as “Ullal&amp;India”. Upon examining the original text, we find that both interpretations are logical: one annotator retained “Ullal”, a location mentioned in the impact sentence, while the other included “Gujarat”, mentioned in the leading sentence of the related impact in the paragraph. These variations in interpretation contribute to inter-annotator agreement errors. Such discrepancies in the L2 and L3 annotations will be addressed in a forthcoming version of the database.</p>
</sec>
</sec>
<sec id="Ch1.S4.SS2">
  <label>4.2</label><title>Evaluation Methods</title>
      <p id="d2e2820">We evaluate the LLM output using the above-described test set from the gold standard data. The evaluation involves all three levels of information. For all main events, the three levels contain many fields, making evaluation challenging. To obtain an overall aggregated score for each event, as well as scores for specific fields, we define a difference error metric for each field, ranging from 0 to 1 (where lower values indicate better performance). We then calculate an aggregated score as a weighted sum of these field-specific scores:

            <disp-formula id="Ch1.E1" content-type="numbered"><label>1</label><mml:math id="M22" display="block"><mml:mrow><mml:mi>D</mml:mi><mml:mo>(</mml:mo><mml:mi>a</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mo>)</mml:mo><mml:mo>:=</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mn mathvariant="normal">1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mstyle><mml:munder><mml:mo movablelimits="false">∑</mml:mo><mml:mi>i</mml:mi></mml:munder><mml:msub><mml:mi>w</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>d</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mfenced close=")" open="("><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>r</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfenced></mml:mrow></mml:math></disp-formula>

          <inline-formula><mml:math id="M23" display="inline"><mml:mrow><mml:mi>D</mml:mi><mml:mo>(</mml:mo><mml:mi>a</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula> is the difference between a gold entry <inline-formula><mml:math id="M24" display="inline"><mml:mi>a</mml:mi></mml:math></inline-formula> and an LLM output entry <inline-formula><mml:math id="M25" display="inline"><mml:mi>r</mml:mi></mml:math></inline-formula>, with weights <inline-formula><mml:math id="M26" display="inline"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and difference metrics <inline-formula><mml:math id="M27" display="inline"><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> of fields <inline-formula><mml:math id="M28" display="inline"><mml:mi>i</mml:mi></mml:math></inline-formula>, where <inline-formula><mml:math id="M29" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> is the number of fields. This approach allows to adjust the relative influence of each field by modifying its weight. Since the importance of the different fields is user-dependent, in this paper we present evaluation results with an equal weighting of all fields.</p>
      <p id="d2e2948">The difference metrics for specific fields are defined based on metrics for the following basic types: numbers, strings, booleans, and lists. <list list-type="bullet"><list-item>
      <p id="d2e2953">For (non-negative) numbers:<disp-formula id="Ch1.E2" content-type="numbered"><label>2</label><mml:math id="M30" display="block"><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi>a</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mo>)</mml:mo><mml:mo>:=</mml:mo><mml:mfenced open="{" close=""><mml:mtable class="array" columnalign="left left"><mml:mtr><mml:mtd><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mtext>if</mml:mtext><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mspace linebreak="nobreak" width="0.25em"/><mml:mi>a</mml:mi><mml:mo>=</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mstyle displaystyle="false"><mml:mstyle displaystyle="false"><mml:mfrac style="text"><mml:mrow><mml:mo>|</mml:mo><mml:mi>a</mml:mi><mml:mo>-</mml:mo><mml:mi>r</mml:mi><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mi>a</mml:mi><mml:mo>+</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac></mml:mstyle></mml:mstyle><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mtext>otherwise</mml:mtext></mml:mtd></mml:mtr></mml:mtable></mml:mfenced></mml:mrow></mml:math></disp-formula></p></list-item><list-item>
      <p id="d2e3029">For strings and booleans:<disp-formula id="Ch1.E3" content-type="numbered"><label>3</label><mml:math id="M31" display="block"><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>,</mml:mo><mml:mi>b</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mi>a</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mo>)</mml:mo><mml:mo>:=</mml:mo><mml:mfenced open="{" close=""><mml:mtable class="array" columnalign="left left"><mml:mtr><mml:mtd><mml:mrow><mml:mn mathvariant="normal">0</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mtext>if</mml:mtext><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mspace width="0.25em" linebreak="nobreak"/><mml:mi>a</mml:mi><mml:mo>=</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mtext>otherwise</mml:mtext></mml:mtd></mml:mtr></mml:mtable></mml:mfenced></mml:mrow></mml:math></disp-formula></p></list-item><list-item>
      <p id="d2e3091">For lists:<disp-formula id="Ch1.E4" content-type="numbered"><label>4</label><mml:math id="M32" display="block"><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mi>s</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mi>a</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mo>)</mml:mo><mml:mo>:=</mml:mo><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:mstyle displaystyle="true"><mml:mfrac style="display"><mml:mrow><mml:mo>|</mml:mo><mml:mi>a</mml:mi><mml:mo>∩</mml:mo><mml:mi>r</mml:mi><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mo>|</mml:mo><mml:mi>a</mml:mi><mml:mo>∪</mml:mo><mml:mi>r</mml:mi><mml:mo>|</mml:mo></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:math></disp-formula></p></list-item></list></p>
      <p id="d2e3144">Rather than using more conventional evaluation metrics (such as accuracy, recall, or precision), we opt to use metrics tailored to the database's specific application: representing climate extremes and their impacts. For instance, if the correct number of deaths is 10, an output of 11 would result in a minor error, whereas an output of 100 would be a substantial error. Under the current metric, these predictions receive a normalized error rates of 0.048 and 0.818, respectively.</p>
      <p id="d2e3147">In this paper, we evaluate only those fields that are directly extracted by GPT4o, excluding any post-processed or otherwise derived fields. Specifically, our assessment is limited to the fields in Table <xref ref-type="table" rid="T3a"/> that appear without an asterisk, as the asterisked fields are obtained through post-processing rather than representing the raw output of the LLM. For the evaluation of L1, the LLM output is automatically matched with the gold standard using the Event_ID since only a single entry is retrieved per article in L1. However, for L2 and L3, the number of entries extracted by the LLM may vary, compared to the gold standard. For instance, for the same event there may be 5 entries in L2 from the gold standard, but 10 entries in the LLM output. To address this, we implement a matching algorithm during the L2/L3 evaluation process that identifies the most similar entries in the LLM output and the gold standard. The matching algorithm uses the same evaluation metrics as above to determine similarity of entries as <inline-formula><mml:math id="M33" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>-</mml:mo><mml:mi>d</mml:mi><mml:mo>(</mml:mo><mml:mi>a</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:math></inline-formula>, and the best matching entry pairs in the LLM output and the gold standard are then selected. The remaining entries in the gold data or the LLM output are matched to empty entries padded with “NULL” values. This results in two lists of entries of equal length, which is the desired format for evaluation. In the matching algorithm, it is possible to select different values for some important parameters: <list list-type="bullet"><list-item>
      <p id="d2e3176">the similarity threshold under which entries are not considered to be a good match</p></list-item><list-item>
      <p id="d2e3180">the weights for different fields used when matching</p></list-item><list-item>
      <p id="d2e3184">the null penalty, which is the error value assigned in the difference metrics when one of the two entries contains a “NULL” value</p></list-item></list></p>
      <p id="d2e3188">We use the 55 events in the gold standard development set to select the matching algorithm's parameters setting. For the rest of the evaluation, we use the parameter set termed “Setting 2” in Sect. S5, Table S10.</p>
</sec>
<sec id="Ch1.S4.SS3">
  <label>4.3</label><title>Evaluation Results</title>
      <p id="d2e3199">Table <xref ref-type="table" rid="T6"/> shows that the model performs consistently well across all L1 fields in the test set. The error rates for Main Event and Hazards are 0.0256 and 0.2004, respectively, indicating that the model effectively captures robust information for the Main Event and comparatively reliable information for the associated hazards. Regarding time-related information, the model achieves near-perfect performance, with error rates ranging from 0.0003 to 0.0463. However, the location information exhibits a higher error rate of 0.4843. For the impact categories, Total Deaths has the lowest error rates, ranging from 0.0236 to 0.0374; Total Damage and Total Insured Damage also show low error rates of approximately 0.07 and 0.012, respectively. For other impact categories, error rates range from 0.2118 to 0.311, indicating that the LLM encounters difficulties in capturing this information from Wikipedia articles.</p>

<table-wrap id="T6"><label>Table 6</label><caption><p id="d2e3207">The L1 evaluation results on the gold standard test set. The Weighted Score represents the average across all fields, given an equal weighting. Scores for each field are also averaged. For instance, the score of 0.0256 in the “Main_Event” field corresponds to the average score for all 156 test set events within this category. Numbers closer to 0 indicate a close match between two entries, while numbers closer to 1 indicate a poorer match.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="2">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="center"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Field</oasis:entry>
         <oasis:entry colname="col2">Score</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Weighted_Score</oasis:entry>
         <oasis:entry colname="col2">0.1431</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Main_Event</oasis:entry>
         <oasis:entry colname="col2">0.0256</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Hazards</oasis:entry>
         <oasis:entry colname="col2">0.2004</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Day</oasis:entry>
         <oasis:entry colname="col2">0.0299</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Month</oasis:entry>
         <oasis:entry colname="col2">0.0115</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Year</oasis:entry>
         <oasis:entry colname="col2">0.0003</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Day</oasis:entry>
         <oasis:entry colname="col2">0.0463</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Month</oasis:entry>
         <oasis:entry colname="col2">0.0194</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Year</oasis:entry>
         <oasis:entry colname="col2">0.0066</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Administrative_Areas_Norm</oasis:entry>
         <oasis:entry colname="col2">0.4843</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Deaths_Min</oasis:entry>
         <oasis:entry colname="col2">0.0374</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Deaths_Max</oasis:entry>
         <oasis:entry colname="col2">0.0236</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Injuries_Max</oasis:entry>
         <oasis:entry colname="col2">0.2118</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Injuries_Min</oasis:entry>
         <oasis:entry colname="col2">0.2115</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Homeless_Min</oasis:entry>
         <oasis:entry colname="col2">0.2559</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Homeless_Max</oasis:entry>
         <oasis:entry colname="col2">0.2528</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Displaced_Min</oasis:entry>
         <oasis:entry colname="col2">0.2950</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Displaced_Max</oasis:entry>
         <oasis:entry colname="col2">0.2963</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Affected_Min</oasis:entry>
         <oasis:entry colname="col2">0.3110</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Total_Affected_Max</oasis:entry>
         <oasis:entry colname="col2">0.2993</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Buildings_Damaged_Min</oasis:entry>
         <oasis:entry colname="col2">0.2827</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Buildings_Damaged_Max</oasis:entry>
         <oasis:entry colname="col2">0.2797</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Insured_Damage_Min</oasis:entry>
         <oasis:entry colname="col2">0.1218</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Insured_Damage_Max</oasis:entry>
         <oasis:entry colname="col2">0.1218</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Insured_Damage_Unit</oasis:entry>
         <oasis:entry colname="col2">0.1474</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Insured_Damage_Inflation_Adjusted</oasis:entry>
         <oasis:entry colname="col2">0.1667</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Insured_Damage_Inflation_Adjusted_Year</oasis:entry>
         <oasis:entry colname="col2">0.0064</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Damage_Min</oasis:entry>
         <oasis:entry colname="col2">0.0706</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Damage_Max</oasis:entry>
         <oasis:entry colname="col2">0.0729</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Damage_Unit</oasis:entry>
         <oasis:entry colname="col2">0.0321</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Damage_Inflation_Adjusted</oasis:entry>
         <oasis:entry colname="col2">0.1026</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Total_Damage_Inflation_Adjusted_Year</oasis:entry>
         <oasis:entry colname="col2">0.0128</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

      <p id="d2e3527">Tables <xref ref-type="table" rid="T7"/> and <xref ref-type="table" rid="T8"/> present the evaluation results for L2 and L3. For these two levels, the model's performance on the test set is comparable to its performance on the development set (see Sect. S5, Table S11). Next to the Weighted_Score in each impact category, the error rates for individual fields within the impact categories are presented in these tables. The location field Administrative_Areas_Norm exhibits the highest error rate across all impact categories in L2. Similarly, in L3, both Administrative_Area_Norm and Locations_Norm display higher error rates compared to other fields. Notably, time-related information in both L2 and L3 has relatively low error rates, which are generally lower than the Weighted_Score. For impact information fields such as Num_Min and Num_Max, L2 generally achieves lower error rates compared to L3. Referring to the Weighted_Score across all impact categories, the information in L2 is more robust than that in L3 within our database. Furthermore, across impact categories, Injuries, Homeless, and Displaced exhibit relatively lower error rates than other categories.</p>

<table-wrap id="T7" specific-use="star"><label>Table 7</label><caption><p id="d2e3538">The L2 evaluation results on the gold standard test set, for each field within the impact categories. The Weighted Score represents the average across all fields in a given impact category, which are given an equal weighting. For example, the Weighted Score “0.4221” for “Deaths” is the mean error of all the fields in this category.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="9">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right"/>
     <oasis:colspec colnum="8" colname="col8" align="right"/>
     <oasis:colspec colnum="9" colname="col9" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Deaths</oasis:entry>
         <oasis:entry colname="col3">Injuries</oasis:entry>
         <oasis:entry colname="col4">Homeless</oasis:entry>
         <oasis:entry colname="col5">Displaced</oasis:entry>
         <oasis:entry colname="col6">Affected</oasis:entry>
         <oasis:entry colname="col7">Buildings_Damaged</oasis:entry>
         <oasis:entry colname="col8">Insured_Damage</oasis:entry>
         <oasis:entry colname="col9">Damage</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Weighted_Score</oasis:entry>
         <oasis:entry colname="col2">0.4221</oasis:entry>
         <oasis:entry colname="col3">0.3171</oasis:entry>
         <oasis:entry colname="col4">0.3928</oasis:entry>
         <oasis:entry colname="col5">0.3709</oasis:entry>
         <oasis:entry colname="col6">0.4695</oasis:entry>
         <oasis:entry colname="col7">0.5125</oasis:entry>
         <oasis:entry colname="col8">0.5308</oasis:entry>
         <oasis:entry colname="col9">0.4772</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Day</oasis:entry>
         <oasis:entry colname="col2">0.2310</oasis:entry>
         <oasis:entry colname="col3">0.2479</oasis:entry>
         <oasis:entry colname="col4">0.3051</oasis:entry>
         <oasis:entry colname="col5">0.3321</oasis:entry>
         <oasis:entry colname="col6">0.4247</oasis:entry>
         <oasis:entry colname="col7">0.4860</oasis:entry>
         <oasis:entry colname="col8">0.8210</oasis:entry>
         <oasis:entry colname="col9">0.5542</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Month</oasis:entry>
         <oasis:entry colname="col2">0.2310</oasis:entry>
         <oasis:entry colname="col3">0.2479</oasis:entry>
         <oasis:entry colname="col4">0.3051</oasis:entry>
         <oasis:entry colname="col5">0.3321</oasis:entry>
         <oasis:entry colname="col6">0.4219</oasis:entry>
         <oasis:entry colname="col7">0.4832</oasis:entry>
         <oasis:entry colname="col8">0.8198</oasis:entry>
         <oasis:entry colname="col9">0.5550</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Year</oasis:entry>
         <oasis:entry colname="col2">0.5446</oasis:entry>
         <oasis:entry colname="col3">0.3277</oasis:entry>
         <oasis:entry colname="col4">0.3517</oasis:entry>
         <oasis:entry colname="col5">0.3931</oasis:entry>
         <oasis:entry colname="col6">0.4665</oasis:entry>
         <oasis:entry colname="col7">0.5902</oasis:entry>
         <oasis:entry colname="col8">0.8198</oasis:entry>
         <oasis:entry colname="col9">0.6906</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Day</oasis:entry>
         <oasis:entry colname="col2">0.2244</oasis:entry>
         <oasis:entry colname="col3">0.1849</oasis:entry>
         <oasis:entry colname="col4">0.2288</oasis:entry>
         <oasis:entry colname="col5">0.1870</oasis:entry>
         <oasis:entry colname="col6">0.2987</oasis:entry>
         <oasis:entry colname="col7">0.4039</oasis:entry>
         <oasis:entry colname="col8">0.7477</oasis:entry>
         <oasis:entry colname="col9">0.4830</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Month</oasis:entry>
         <oasis:entry colname="col2">0.2244</oasis:entry>
         <oasis:entry colname="col3">0.1849</oasis:entry>
         <oasis:entry colname="col4">0.2288</oasis:entry>
         <oasis:entry colname="col5">0.1870</oasis:entry>
         <oasis:entry colname="col6">0.2946</oasis:entry>
         <oasis:entry colname="col7">0.4012</oasis:entry>
         <oasis:entry colname="col8">0.7477</oasis:entry>
         <oasis:entry colname="col9">0.4868</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">End_Date_Year</oasis:entry>
         <oasis:entry colname="col2">0.2508</oasis:entry>
         <oasis:entry colname="col3">0.2101</oasis:entry>
         <oasis:entry colname="col4">0.2331</oasis:entry>
         <oasis:entry colname="col5">0.1985</oasis:entry>
         <oasis:entry colname="col6">0.3163</oasis:entry>
         <oasis:entry colname="col7">0.4037</oasis:entry>
         <oasis:entry colname="col8">0.7523</oasis:entry>
         <oasis:entry colname="col9">0.4981</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Administrative_Areas_Norm</oasis:entry>
         <oasis:entry colname="col2">0.7665</oasis:entry>
         <oasis:entry colname="col3">0.9076</oasis:entry>
         <oasis:entry colname="col4">0.9576</oasis:entry>
         <oasis:entry colname="col5">0.9351</oasis:entry>
         <oasis:entry colname="col6">0.9617</oasis:entry>
         <oasis:entry colname="col7">0.9358</oasis:entry>
         <oasis:entry colname="col8">0.9775</oasis:entry>
         <oasis:entry colname="col9">0.7887</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Min</oasis:entry>
         <oasis:entry colname="col2">0.6618</oasis:entry>
         <oasis:entry colname="col3">0.2724</oasis:entry>
         <oasis:entry colname="col4">0.4619</oasis:entry>
         <oasis:entry colname="col5">0.3864</oasis:entry>
         <oasis:entry colname="col6">0.5208</oasis:entry>
         <oasis:entry colname="col7">0.4543</oasis:entry>
         <oasis:entry colname="col8">0.1570</oasis:entry>
         <oasis:entry colname="col9">0.4030</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Max</oasis:entry>
         <oasis:entry colname="col2">0.6643</oasis:entry>
         <oasis:entry colname="col3">0.2702</oasis:entry>
         <oasis:entry colname="col4">0.4633</oasis:entry>
         <oasis:entry colname="col5">0.3865</oasis:entry>
         <oasis:entry colname="col6">0.5208</oasis:entry>
         <oasis:entry colname="col7">0.4541</oasis:entry>
         <oasis:entry colname="col8">0.1573</oasis:entry>
         <oasis:entry colname="col9">0.4023</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Unit</oasis:entry>
         <oasis:entry colname="col2">NA</oasis:entry>
         <oasis:entry colname="col3">NA</oasis:entry>
         <oasis:entry colname="col4">NA</oasis:entry>
         <oasis:entry colname="col5">NA</oasis:entry>
         <oasis:entry colname="col6">NA</oasis:entry>
         <oasis:entry colname="col7">NA</oasis:entry>
         <oasis:entry colname="col8">0.1757</oasis:entry>
         <oasis:entry colname="col9">0.4151</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Inflation_Adjusted</oasis:entry>
         <oasis:entry colname="col2">NA</oasis:entry>
         <oasis:entry colname="col3">NA</oasis:entry>
         <oasis:entry colname="col4">NA</oasis:entry>
         <oasis:entry colname="col5">NA</oasis:entry>
         <oasis:entry colname="col6">NA</oasis:entry>
         <oasis:entry colname="col7">NA</oasis:entry>
         <oasis:entry colname="col8">0.1892</oasis:entry>
         <oasis:entry colname="col9">0.4415</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Inflation_Adjusted_Year</oasis:entry>
         <oasis:entry colname="col2">NA</oasis:entry>
         <oasis:entry colname="col3">NA</oasis:entry>
         <oasis:entry colname="col4">NA</oasis:entry>
         <oasis:entry colname="col5">NA</oasis:entry>
         <oasis:entry colname="col6">NA</oasis:entry>
         <oasis:entry colname="col7">NA</oasis:entry>
         <oasis:entry colname="col8">0.0045</oasis:entry>
         <oasis:entry colname="col9">0.0075</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e3541">NA: not available.</p></table-wrap-foot></table-wrap>

<table-wrap id="T8" specific-use="star"><label>Table 8</label><caption><p id="d2e4014">The L3 evaluation results of the gold standard test set, presented following the same format as in Table <xref ref-type="table" rid="T7"/>.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="9">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right"/>
     <oasis:colspec colnum="8" colname="col8" align="right"/>
     <oasis:colspec colnum="9" colname="col9" align="right"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Deaths</oasis:entry>
         <oasis:entry colname="col3">Injuries</oasis:entry>
         <oasis:entry colname="col4">Homeless</oasis:entry>
         <oasis:entry colname="col5">Displaced</oasis:entry>
         <oasis:entry colname="col6">Affected</oasis:entry>
         <oasis:entry colname="col7">Buildings_Damaged</oasis:entry>
         <oasis:entry colname="col8">Insured_Damage</oasis:entry>
         <oasis:entry colname="col9">Damage</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Weighted_Score</oasis:entry>
         <oasis:entry colname="col2">0.4896</oasis:entry>
         <oasis:entry colname="col3">0.4228</oasis:entry>
         <oasis:entry colname="col4">0.4582</oasis:entry>
         <oasis:entry colname="col5">0.4684</oasis:entry>
         <oasis:entry colname="col6">0.5022</oasis:entry>
         <oasis:entry colname="col7">0.6031</oasis:entry>
         <oasis:entry colname="col8">0.5788</oasis:entry>
         <oasis:entry colname="col9">0.5371</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Day</oasis:entry>
         <oasis:entry colname="col2">0.3222</oasis:entry>
         <oasis:entry colname="col3">0.2486</oasis:entry>
         <oasis:entry colname="col4">0.2699</oasis:entry>
         <oasis:entry colname="col5">0.3190</oasis:entry>
         <oasis:entry colname="col6">0.3081</oasis:entry>
         <oasis:entry colname="col7">0.5314</oasis:entry>
         <oasis:entry colname="col8">0.8110</oasis:entry>
         <oasis:entry colname="col9">0.6202</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Month</oasis:entry>
         <oasis:entry colname="col2">0.3194</oasis:entry>
         <oasis:entry colname="col3">0.2486</oasis:entry>
         <oasis:entry colname="col4">0.2752</oasis:entry>
         <oasis:entry colname="col5">0.3178</oasis:entry>
         <oasis:entry colname="col6">0.3100</oasis:entry>
         <oasis:entry colname="col7">0.5326</oasis:entry>
         <oasis:entry colname="col8">0.8110</oasis:entry>
         <oasis:entry colname="col9">0.6260</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Start_Date_Year</oasis:entry>
         <oasis:entry colname="col2">0.5916</oasis:entry>
         <oasis:entry colname="col3">0.3728</oasis:entry>
         <oasis:entry colname="col4">0.2888</oasis:entry>
         <oasis:entry colname="col5">0.4289</oasis:entry>
         <oasis:entry colname="col6">0.3161</oasis:entry>
         <oasis:entry colname="col7">0.6591</oasis:entry>
         <oasis:entry colname="col8">0.8171</oasis:entry>
         <oasis:entry colname="col9">0.6279</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Day</oasis:entry>
         <oasis:entry colname="col2">0.2728</oasis:entry>
         <oasis:entry colname="col3">0.1909</oasis:entry>
         <oasis:entry colname="col4">0.1962</oasis:entry>
         <oasis:entry colname="col5">0.1907</oasis:entry>
         <oasis:entry colname="col6">0.2207</oasis:entry>
         <oasis:entry colname="col7">0.4558</oasis:entry>
         <oasis:entry colname="col8">0.7530</oasis:entry>
         <oasis:entry colname="col9">0.5465</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">End_Date_Month</oasis:entry>
         <oasis:entry colname="col2">0.2743</oasis:entry>
         <oasis:entry colname="col3">0.1908</oasis:entry>
         <oasis:entry colname="col4">0.1962</oasis:entry>
         <oasis:entry colname="col5">0.1929</oasis:entry>
         <oasis:entry colname="col6">0.2204</oasis:entry>
         <oasis:entry colname="col7">0.4552</oasis:entry>
         <oasis:entry colname="col8">0.7530</oasis:entry>
         <oasis:entry colname="col9">0.5543</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">End_Date_Year</oasis:entry>
         <oasis:entry colname="col2">0.2915</oasis:entry>
         <oasis:entry colname="col3">0.1965</oasis:entry>
         <oasis:entry colname="col4">0.1962</oasis:entry>
         <oasis:entry colname="col5">0.2031</oasis:entry>
         <oasis:entry colname="col6">0.2249</oasis:entry>
         <oasis:entry colname="col7">0.4692</oasis:entry>
         <oasis:entry colname="col8">0.7561</oasis:entry>
         <oasis:entry colname="col9">0.5562</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Administrative_Area_Norm</oasis:entry>
         <oasis:entry colname="col2">0.7225</oasis:entry>
         <oasis:entry colname="col3">0.9162</oasis:entry>
         <oasis:entry colname="col4">0.9646</oasis:entry>
         <oasis:entry colname="col5">0.8858</oasis:entry>
         <oasis:entry colname="col6">0.9757</oasis:entry>
         <oasis:entry colname="col7">0.8629</oasis:entry>
         <oasis:entry colname="col8">0.9939</oasis:entry>
         <oasis:entry colname="col9">0.9806</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Locations_Norm</oasis:entry>
         <oasis:entry colname="col2">0.8528</oasis:entry>
         <oasis:entry colname="col3">0.9552</oasis:entry>
         <oasis:entry colname="col4">0.9714</oasis:entry>
         <oasis:entry colname="col5">0.9387</oasis:entry>
         <oasis:entry colname="col6">0.9886</oasis:entry>
         <oasis:entry colname="col7">0.9194</oasis:entry>
         <oasis:entry colname="col8">0.9939</oasis:entry>
         <oasis:entry colname="col9">1.0000</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Min</oasis:entry>
         <oasis:entry colname="col2">0.6245</oasis:entry>
         <oasis:entry colname="col3">0.4541</oasis:entry>
         <oasis:entry colname="col4">0.6117</oasis:entry>
         <oasis:entry colname="col5">0.6056</oasis:entry>
         <oasis:entry colname="col6">0.7288</oasis:entry>
         <oasis:entry colname="col7">0.5734</oasis:entry>
         <oasis:entry colname="col8">0.1925</oasis:entry>
         <oasis:entry colname="col9">0.3450</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Max</oasis:entry>
         <oasis:entry colname="col2">0.6247</oasis:entry>
         <oasis:entry colname="col3">0.4546</oasis:entry>
         <oasis:entry colname="col4">0.6115</oasis:entry>
         <oasis:entry colname="col5">0.6016</oasis:entry>
         <oasis:entry colname="col6">0.7289</oasis:entry>
         <oasis:entry colname="col7">0.5721</oasis:entry>
         <oasis:entry colname="col8">0.1921</oasis:entry>
         <oasis:entry colname="col9">0.3450</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Unit</oasis:entry>
         <oasis:entry colname="col2">NA</oasis:entry>
         <oasis:entry colname="col3">NA</oasis:entry>
         <oasis:entry colname="col4">NA</oasis:entry>
         <oasis:entry colname="col5">NA</oasis:entry>
         <oasis:entry colname="col6">NA</oasis:entry>
         <oasis:entry colname="col7">NA</oasis:entry>
         <oasis:entry colname="col8">0.2134</oasis:entry>
         <oasis:entry colname="col9">0.3837</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Inflation_Adjusted</oasis:entry>
         <oasis:entry colname="col2">NA</oasis:entry>
         <oasis:entry colname="col3">NA</oasis:entry>
         <oasis:entry colname="col4">NA</oasis:entry>
         <oasis:entry colname="col5">NA</oasis:entry>
         <oasis:entry colname="col6">NA</oasis:entry>
         <oasis:entry colname="col7">NA</oasis:entry>
         <oasis:entry colname="col8">0.2317</oasis:entry>
         <oasis:entry colname="col9">0.3876</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Num_Inflation_Adjusted_Year</oasis:entry>
         <oasis:entry colname="col2">NA</oasis:entry>
         <oasis:entry colname="col3">NA</oasis:entry>
         <oasis:entry colname="col4">NA</oasis:entry>
         <oasis:entry colname="col5">NA</oasis:entry>
         <oasis:entry colname="col6">NA</oasis:entry>
         <oasis:entry colname="col7">NA</oasis:entry>
         <oasis:entry colname="col8">0.0061</oasis:entry>
         <oasis:entry colname="col9">0.0097</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e4019">NA: not available.</p></table-wrap-foot></table-wrap>

      <p id="d2e4520">Overall, the L1 information extracted by the LLM thus provides the most reliable representation of the underlying Wikipedia articles, followed by L2 and L3. Within L1, event and timing data are highly accurate, while location data is less robust. The Deaths category in L1 has the lowest error, followed by Damage and Insured Damage, with other categories showing higher errors. In L2 and L3, the injuries, homeless, and displaced categories are most reliable. We underscore that the evaluation is conducted only the LLM output, not the final database entries. In the final entries, the output of the LLM may be corrected through post-processing, for example by aggregating L2 impact information to revise the corresponding L1 value. This is why we maintain the categories in the database even when the error scores are high (e.g., the Location_Norm of Damage in L3 with an error score of 1). For further discussion of the evaluation errors and database quality, we refer the reader to Sect. 6.1.</p>
</sec>
</sec>
<sec id="Ch1.S5">
  <label>5</label><title>Wikimpacts 1.0 Content of the Database</title>
      <p id="d2e4533">The Wikimpacts database, version 1.0, encompasses a total of 2726 events. These correspond to the subset of the 3146 events, each mapped to a single-event article (Sect. <xref ref-type="sec" rid="Ch1.S3.SS1"/>) for which all mandatory fields were completed. At the event level (L1), tropical cyclones are the dominant event type, constituting 56.93 % of events in the dataset (Fig. <xref ref-type="fig" rid="F4"/>a). They are followed by floods (13.1 %); tornadoes, wildfires, and extratropical storms also collectively account for a substantial portion of events. Droughts and extreme temperatures are less frequently recorded. The national level (L2) contains a total of 17,912 data entries and exhibits a similar distribution as L1 across event categories, although the share accounted for by tropical cyclones is increased (Fig. <xref ref-type="fig" rid="F4"/>b). At the sub-national level (L3), there are 32 343 data entries, with tropical cyclones again comprising the largest share of recorded entries at 65.62 %, followed by floods at 10.65 % and tornadoes at 10.01 % (Fig. <xref ref-type="fig" rid="F4"/>c). Notably, the Wikimpacts 1.0 database is constructed from events recorded in the English-language Wikipedia, and does not constitute an exhaustive record of all climate extremes.</p>

      <fig id="F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e4546">Statistics overview of Wikimpacts 1.0. <bold>(a)</bold> Number of main events in L1, <bold>(b)</bold> number of impact data entries in L2 (national level), <bold>(c)</bold> number of impact data entries in L3 (sub-national level). Abbreviations are as follows: Extratropical Storm/Cyclone (Extrat. Cycl), Tropical Storm/Cyclone (Trop. Cycl), and Extreme Temperature (Extr. Temp.). These abbreviations are also used in subsequent Figs. <xref ref-type="fig" rid="F5"/> and <xref ref-type="fig" rid="F6"/>.</p></caption>
        <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f04.png"/>

      </fig>

<sec id="Ch1.S5.SS1">
  <label>5.1</label><title>L1 (Event Level)</title>
<sec id="Ch1.S5.SS1.SSS1">
  <label>5.1.1</label><title>Temporal Distribution</title>
      <p id="d2e4582">Figure <xref ref-type="fig" rid="F5"/>a presents the decadal trends of the number of events in Wikimpacts 1.0, with our database encompassing data from the years 1034 through 2024. Although entries from the early period, spanning the 1030s to the 1890s (Fig. <xref ref-type="fig" rid="F5"/>b), are limited, a discernible upward trend emerges in the 1850s. Nonetheless, as records prior to 1900 are sparse due to limited reporting, we view them as unsuitable for quantitative trend analyses. The number of recorded events continues to increase steadily until the 2010s. However, due to the 2020s data only covering January 2020 to February 2024, the number of events for the current decade is lower (Fig. <xref ref-type="fig" rid="F5"/>a). The upward trend in time is evident across all main event categories. Further research is needed to disentangle the potential causes for this increase (e.g., improved reporting, rising number of events, increased exposure).</p>

      <fig id="F5" specific-use="star"><label>Figure 5</label><caption><p id="d2e4593">The temporal distribution of main events (L1) in Wikimpacts 1.0. <bold>(a)</bold> The decadal distribution of main events in Wikimpacts 1.0 spanning all decades, from the 1030s to the 2020s, and <bold>(b)</bold> the decadal distribution of main events in Wikimpacts 1.0 during the early period, covering the 1030s to the 1890s. Note the discontinuous <inline-formula><mml:math id="M34" display="inline"><mml:mi>x</mml:mi></mml:math></inline-formula>-axis scale for the 1030s–1760s in both panels and the fact that the 2020s only include data up to February 2024.</p></caption>
            <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f05.png"/>

          </fig>

</sec>
<sec id="Ch1.S5.SS1.SSS2">
  <label>5.1.2</label><title>Impact Distribution</title>
      <p id="d2e4623">Tropical storms are the most frequently recorded events, and they indeed dominate the aggregated impacts for many impact categories with the number of injuries being a notable expection (Fig. <xref ref-type="fig" rid="F6"/>). However, there are several cases in which much less frequent main event categories display comparable aggregated impacts. For instance, droughts contribute to almost as many deaths as tropical cyclones, despite being over 140 times less frequent in our database (Fig. <xref ref-type="fig" rid="F6"/>a). The single most severe drought event reported is the “1983–1985 famine in Ethiopia” <xref ref-type="bibr" rid="bib1.bibx63" id="paren.50"/>, which led to approximately 1.2 million deaths. Floods and tropical storms also result in substantial numbers of deaths, and they are also among the most frequently recorded events in the database. Floods are also notable for causing the highest number of injuries (Fig. <xref ref-type="fig" rid="F6"/>b), followed by tropical storms and wildfires. There are no injury entries for droughts in our database. Floods rank second for the displaced and homeless impact categories, with extreme temperatures and tropical storms also playing a significant role (Fig. <xref ref-type="fig" rid="F6"/>c–d). Extreme temperatures rank second for total number of affected people and total damage (Fig. <xref ref-type="fig" rid="F6"/>e, h), while extratropical cyclones rank second for buildings damaged and insured damage (Fig. <xref ref-type="fig" rid="F6"/>f, g). Overall, tropical storms thus dominate the impacts recorded in our database, followed by floods. Nonetheless, all of the other main event categories also display substantial impacts in specific impact categories.</p>

      <fig id="F6" specific-use="star"><label>Figure 6</label><caption><p id="d2e4644">Total impact of each main event category in the Wikimpacts 1.0 database. Error bars represent the Max-Min range from L1 and the bar heights reflect the middle of the intervals from L1. <bold>(a)</bold> Deaths, <bold>(b)</bold> Injuries, <bold>(c)</bold> Homeless, <bold>(d)</bold> Displaced, <bold>(e)</bold> Affected, <bold>(f)</bold> Buildings Damaged, <bold>(g)</bold> Insured Damage, and <bold>(h)</bold> Total Damage. Note the logarithmic <inline-formula><mml:math id="M35" display="inline"><mml:mi>y</mml:mi></mml:math></inline-formula>-axis scale.</p></caption>
            <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f06.png"/>

          </fig>

</sec>
<sec id="Ch1.S5.SS1.SSS3">
  <label>5.1.3</label><title>Spatial Distribution</title>
      <p id="d2e4693">The database encompasses events globally, with the US (1140 events) exhibiting the highest number of occurrences (Fig. <xref ref-type="fig" rid="F7"/>a). Mexico, Canada, the Philippines, China, and Japan follow with 326, 305, 304, 284, and 261 events, respectively. Australia has 143 events, followed by Vietnam and the United Kingdom with 138 events recorded. There are comparatively fewer entries from the Global South (Comprising Africa, Latin America and the Caribbean, Asia excluding Israel, Japan, and South Korea, and Oceania excluding Australia and New Zealand, according to UN Trade and Development), particularly in Africa and South America. While event entries remain limited also in Europe, they remain more numerous than for many Global South regions.</p>

      <fig id="F7" specific-use="star"><label>Figure 7</label><caption><p id="d2e4700">Spatial distribution of main events in the Wikimpacts 1.0 database, based on L1 entries: <bold>(a)</bold> spatial distribution of all main events, <bold>(b)</bold> spatial distribution of Tropical Storm/Cyclone events, <bold>(c)</bold> spatial distribution of Extratropical Storm/Cyclone events, <bold>(d)</bold> spatial distribution of Flood events, <bold>(e)</bold> spatial distribution of Tornado events, <bold>(f)</bold> spatial distribution of Extreme Temperature events, <bold>(g)</bold> spatial distribution of Wildfire events, and <bold>(h)</bold> spatial distribution of Drought events. Note the non-linear colour scale.</p></caption>
            <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f07.png"/>

          </fig>

      <p id="d2e4734">The spatial distribution of main events for individual event categories (Fig. <xref ref-type="fig" rid="F7"/>b–h) largely mirrors the spatial distribution of all main events (Fig. <xref ref-type="fig" rid="F7"/>a). Tropical storms are documented in most countries, with exceptions including Argentina, Inner Mongolia, and several Central Asian nations. The US leads in tropical storm entries with 543 events, followed by Mexico (305 events), the Philippines (295 events), China (249 events) and Japan (246 events) (Fig. <xref ref-type="fig" rid="F7"/>b). While we report impacts from tropical storms in several mid-latitude countries, the number of such events is low. In most cases, they refer to tropical cyclones that underwent an extratropical transition. If the impacts of the cyclone following the extratropical transition are recorded in the Wikipedia article, we ascribe those impacts to the “Tropical Cyclone” main event category. Examples include “Hurricane Nate (2005)” <xref ref-type="bibr" rid="bib1.bibx52" id="paren.51"/> and “Hurricane Larry” <xref ref-type="bibr" rid="bib1.bibx57" id="paren.52"/>, the latter even impacting Greenland. For extratropical storms (Fig. <xref ref-type="fig" rid="F7"/>c), the majority of entries are in the US (129 events) and Canada (77 events), followed by the UK (56 events), France (42 events), Germany (37 events), Ireland (32 events), the Netherlands (29 events), Belgium (21 events), Spain (19 events), and Italy (17 events). The database contains no entries for extratropical storms in Southeast Asia and some Central Asian countries. However, a few entries are present for Africa. Further investigation reveals that the latter may be an ambiguous classification between the main event categories of flood and extratropical storm/cyclone. For example, the event “2011 European floods” <xref ref-type="bibr" rid="bib1.bibx56" id="paren.53"/> – despite the article's title – also impacted North Africa. The floods were caused by a series of storms, and in our database this main event is categorised as extratropical cyclone. We identify 26 similar cases in our database, for which the main event type is extratropical storm/cyclone and the hazard column lists “flood”, yet the article title contains “flood”. We also find one article, the “1999 Blayais Nuclear Power Plant flood” <xref ref-type="bibr" rid="bib1.bibx55" id="paren.54"/> for which the hazard is “NULL”. We additionally find 26 cases in which the article title contains “flood”, but the Main Event category is tropical storm/cyclone. Finally, we find 15 cases in which the article title suggests a cold wave, but the Main Event category is extratropical storm/cyclone rather than extreme temperature. For all these events, we keep the Main Event category as detected by the LLM. This type of classification affects around 2.5 % of the main events in our database. In terms of floods (Fig. <xref ref-type="fig" rid="F7"/>d), the US (80 events) and India (42 events) have the most entries, followed by China (20 events), Canada (18 events), the UK (15 events), Pakistan (15 events), Australia (13 events), and Germany and Afghanistan (11 events each). Many African and South American countries have only a single flood entry. Regarding tornadoes (Fig. <xref ref-type="fig" rid="F7"/>e), the US (239 events) has the highest number of entries, followed by Canada (24 events) and the UK (9 events). Most African countries lack recorded events for tornadoes. Extreme temperature events are primarily recorded in the US (25 events), Canada (16 events), and the UK (10 events). There are limited entries for extreme temperatures in African countries (Fig. <xref ref-type="fig" rid="F7"/>f), despite this continent being known for extreme heat episodes <xref ref-type="bibr" rid="bib1.bibx31 bib1.bibx18 bib1.bibx47" id="paren.55"/>). For wildfires (Fig. <xref ref-type="fig" rid="F7"/>g), the US (123 events) and Australia (34 events) have the highest number of entries. Wildfire reports are sparse in African countries, Central Asia, Northern Europe, and South America, despite several of these regions being fire-prone <xref ref-type="bibr" rid="bib1.bibx4" id="paren.56"/>. Lastly, droughts (Fig. <xref ref-type="fig" rid="F7"/>h), which have the fewest entries in the database (11 events) but often span several countries, are most frequently recorded in Russia, France, and Australia (2 events each).</p>

      <fig id="F8" specific-use="star"><label>Figure 8</label><caption><p id="d2e4778">Spatial distribution of L2 and L3 impact data entries in Wikimpacts 1.0. <bold>(a)</bold> Spatial distribution of impact data entries at national level(L2), <bold>(b)</bold> spatial distribution of impact data entries at regional level (L3 polygons, see text), and <bold>(c)</bold> spatial distribution of impact data entries at city level (L3 points, see text).</p></caption>
            <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f08.png"/>

          </fig>

      <fig id="F9" specific-use="star"><label>Figure 9</label><caption><p id="d2e4798">Impact data entry comparison between EM-DAT and Wikimpacts 1.0 from 1 January 1900–29 February 2024. <bold>(a)</bold> Number of impact data entries in EM-DAT (in hatched colors) and Wikimpacts 1.0 (in full colors) for each main event category in Wikimpacts 1.0. Note that the EM-DAT Storm category includes all storm-related entries, whereas for Wikimpacts only the Tropical Storm/Cyclone and Extratropical Storm/Cyclone categories are included. <bold>(b)</bold> Spatial distribution of the difference (Wikimpacts 1.0 minus EM-DAT) in number of impact data entries after aggregation across main event categories. Note the non-linear colour scale.</p></caption>
            <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f09.png"/>

          </fig>

      <fig id="F10" specific-use="star"><label>Figure 10</label><caption><p id="d2e4815">Impact value comparison between EM-DAT and Wikimpacts 1.0 over 1 January 1900–29 February 2024. Blue indicates cases where the Wikimpacts impact values are lower than the EM-DAT values, whereas red indicates the opposite. <bold>(a)</bold> The percentage difference between Wikimpacts 1.0 and EM-DAT in the death category, <bold>(b)</bold> injury category, <bold>(c)</bold> homeless category, and <bold>(d)</bold> damage category.</p></caption>
            <graphic xlink:href="https://nhess.copernicus.org/articles/26/2609/2026/nhess-26-2609-2026-f10.png"/>

          </fig>

</sec>
</sec>
<sec id="Ch1.S5.SS2">
  <label>5.2</label><title>L2 Impact Data (National Level)</title>
      <p id="d2e4846">We next investigate the spatial distribution of national-level (L2) impact data entries (Fig. <xref ref-type="fig" rid="F8"/>a). In total, we have 17 912 such entries, with the US having the highest number (4071 entries in total). They are followed by the Philippines with 1174 data entries, Mexico with 1170, Japan with 1003, China with 884, Australia with 515, and Canada with 486. Most African countries display a limited number of impact data entries, with some exceptions such as Madagascar (208 entries). This largely reflects the spatial distribution of the main events (Sect. <xref ref-type="sec" rid="Ch1.S5.SS1.SSS3"/>). Furthermore, a limited number of data entries is observed in parts of Western Latin America, Eastern Europe, and Central Asia.</p>
</sec>
<sec id="Ch1.S5.SS3">
  <label>5.3</label><title>L3 Impact Data (Sub-national Level)</title>
      <p id="d2e4861">The L3 information in our database reflects impact data reported at sub-national level, which we visualise in Fig. <xref ref-type="fig" rid="F8"/>b–c. In total, there are 32 343 entries in L3, and 9 entries contain unexpected GeoJSON shapes, such as ocean shapefiles of the Arabian Sea, which were subsequently removed for visualization purposes (see Sect. S9). The US leads with 10 994 sub-national level entries, followed by Mexico, Japan, the Philippines, China, Australia, India, and Canada, with 2385, 2334, 1845, 1306, 1012, 933, and 694 entries, respectively. Vietnam and Cuba have fewer entries, with 505 and 355 entries, respectively. The GeoJSON files include both polygons and points, where polygons often represent larger administrative areas such as states or provinces (here referred to as “Regions”). Points typically represent cities, towns, or villages (here referred to as “Cities”) for which OpenStreetMap could not find a GeoJSON object of a non-Point shape (such as Polygon or MultiPolygon). In some cases, when a region cannot be represented by a polygon or multi-polygon shape, it is recorded as a point location in our database. The “Regions” map (Fig. <xref ref-type="fig" rid="F8"/>b) indicates that not all states or provinces within a country have recorded impacts (Fig. <xref ref-type="fig" rid="F8"/>b). In some countries, such as China, impacts predominantly occur in coastal regions, with Fujian province having the highest number of data entries at 141, followed by Zhejiang province with 79 entries. In contrast, in the US impacts are distributed across most states, with Delaware having the highest number of entries at 98. In Mexico, a few states have a large number of data entries, like Acapulco (116 entries). In contrast, sub-national impact entries for African countries are limited, particularly in Central and Northern Africa. We observe a similar pattern in Western Latin America. In the “Cities” map, the distribution of impact data entries is more concentrated (Fig. <xref ref-type="fig" rid="F8"/>c). Most entries are of events that occurred in the US, with Outer Banks having the highest number of entries (34), followed by East Texas with 17 entries. Notably, Cabo San Lucas in Mexico also has a large number of data entries, with 27 entries. In Africa, the sub-national impact data entries are concentrated in coastal regions of South, East, and West Africa, whereas in South America, city-level impact data entries appear to be limited.</p>
</sec>
<sec id="Ch1.S5.SS4">
  <label>5.4</label><title>Comparison With EM-DAT</title>
      <p id="d2e4880">We compare the coverage of Wikimpacts 1.0 to the widely-used EM-DAT impact database. As a first step, we align our database's time span with that of EM-DAT (1 January 1900–29 February 2024). To compare the most detailed available level in each dataset, we benchmark the number of impact data entries at L3 between our database and EM-DAT. To ensure a fair comparison, we assign one entry per impact field present in EM-DAT, and EM-DAT disaster subtypes are mapped to our main event categories (see Sect. S6). We specifically map the Tropical Cyclone category in EM-DAT to our Tropical Storm/Cyclone category, and the Extra-Tropical Storm category in EM-DAT to our Extratropical Storm/Cyclone category. Additionally, we aggregate all storm-related entries in EM-DAT and compare this with the combined total of Tropical Storm/Cyclone and Extratropical Storm/Clone categories in our database. For the spatial comparison, we utilize ISO codes from EM-DAT and the Administrative_Areas_GID identifiers from our database.</p>
      <p id="d2e4883">In total, the EM-DAT database contains 35 502 impact data entries, whereas the Wikimpacts 1.0 database comprises 31 405 data entries for the same period. The Wikimpacts 1.0 database includes a greater number of data entries for main event types such as tropical storms (12 767 more entries), extratropical storms (1895 more), tornadoes (1925 more), and wildfires (291 more) (Fig. <xref ref-type="fig" rid="F9"/>a). Notably, our database has 10 280 more entries for storms overall even when considering all storm-related entries in EM-DAT. However, our database contains substantially fewer data entries for floods (fewer by 14 619), as well as fewer data entries for droughts (fewer by 1370) and extreme temperature events (fewer by 618). From a spatial distribution perspective (see Fig. <xref ref-type="fig" rid="F9"/>b), our database contains more impact data entries in the US (7362 more entries), Mexico (1724 more entries), Japan (1456 more entries), Canada (368 more entries), and Australia (293 more entries), as well as in a few countries in Northern Europe and Africa. In contrast, Wikimpacts 1.0 contains fewer impact data entries in most countries in Africa, South America, and Asia. For example, there are fewer data entries in China (1139 fewer), Indonesia (787 fewer), India (697 fewer), Bangladesh (670 fewer), Brazil (562 fewer), Vietnam (448 fewer), and Thailand (373 fewer). Despite these regional differences in coverage, both datasets overall suffer from a spatial reporting biased towards the Global North.</p>
      <p id="d2e4890">We also perform an event-by-event matching between EM-DAT and Wikimpacts. We select four impact categories (deaths, injuries, homeless, and total damage), and compare the L2 data in our database to the country-level impacts from EM-DAT. For each event and each impact variable, we compute the relative difference as ((Wikimpacts impact value <inline-formula><mml:math id="M36" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula> EM-DAT impact value) <inline-formula><mml:math id="M37" display="inline"><mml:mo>/</mml:mo></mml:math></inline-formula> EM-DAT impact value <inline-formula><mml:math id="M38" display="inline"><mml:mo>×</mml:mo></mml:math></inline-formula> 100 %), which quantifies how much the Wikimpacts value differs from the corresponding EM-DAT value. Events are precisely matched based on ISO code (Administrative_Areas_GID), main event type, and exact start/end year and month. We then classify the events depending on whether the impact entries match, or by how much they differ. The comparison is illustrated in Fig. <xref ref-type="fig" rid="F10"/>. In the deaths category, 32 out of 179 matched events exhibit identical values with EM-DAT. Of the remaining events, 38 show higher values by 50 % or more, and 47 show lower values by 50 % or more compared to EM-DAT. In the injury category, 7 out of 77 events perfectly align with EM-DAT values; over one-third of the events exhibit values at least 50 % higher than EM-DAT. For the homeless and damage categories, no events display the same impact values. More events in the homeless category have lower values than EM-DAT, while nearly 94 % in the damage category show higher values than EM-DAT.</p>
</sec>
</sec>
<sec id="Ch1.S6">
  <label>6</label><title>Discussion</title>
<sec id="Ch1.S6.SS1">
  <label>6.1</label><title>Database Quality Assessment</title>
      <p id="d2e4932">The pipeline of the Wikimpacts 1.0 database is designed to capture information contained in Wikipedia articles as accurately as possible. In this respect, the performance of the GPT4o model is crucial for determining the database's quality and robustness. The GPT4o model exhibits strong performance across all three levels of information (see Sects. <xref ref-type="sec" rid="Ch1.S4.SS3"/>, S4 and S5). L1 data is the most robust and reliable, displaying the lowest error rate among the three levels, with the errors increasing as the spatial scale of the reported impacts decreases. L3 data entries display the highest errors. Nonetheless, even for L1, the error rate for location information is high, with a score of 0.48 in Administrative_Areas_Norm across 156 events. We find that 35 NULL penalties, each scoring 1 for the corresponding attribute, account for nearly 46 % of the total error score. Similarly, NULL penalties in the L2 and L3 location information lead to high error scores in these location-related fields. During the consolidation process, we filter out these entries. Moreover, we do not compare the results obtained after consolidation with the gold standard, because, as described in Sect. 3.4, the data are processed from L3 to L2 to L1, and the resulting processed data no longer match the originally annotated data. Thus, the extraction errors from the LLM do not necessarily propagate to the final version of the database. The reasons for these differences are explored in detail in the following error analysis.</p>
<sec id="Ch1.S6.SS1.SSS1">
  <label>6.1.1</label><title>L1 (Event Level)</title>
      <p id="d2e4944">Fields like event timing, main event category, total deaths, and total damage exhibit very low error rates, closely aligning with the gold standard database (Table <xref ref-type="table" rid="T6"/>). Analysing the articles used for model input, we find that most articles in both the development and test sets contain an “Info_Box” that may often include information on the start and end date, the total number of deaths or injuries, or information on the total damage or insured damage. Specifically, 69 out of 70 articles in the development set and 151 out of 156 articles in the test set contain an Info_Box. An example of the Info_Box for the 2021 European Floods can be found in Sect. S1. In addition, the “Event_Name” is directly extracted from the article title and fed to the model. Consequently, for the aforementioned four categories, the model is able to extract information with ease.</p>
      <p id="d2e4949">For the Hazards field, the model occasionally captures undefined hazards, such as “Landslide”, or mixes hazards from one Main Event type with another. For example, it captures “Flood<inline-formula><mml:math id="M39" display="inline"><mml:mo>|</mml:mo></mml:math></inline-formula>Lightning” in a flood event where only “Flood” is defined as the hazard. In the evaluation process, this is given an error rate of 0.5. Consequently, the hazard field exhibits a higher error rate than the Main Event field. For the Administrative_Areas_Norm field, the model performs worse in the test set than in the development set, with the error rate approximately doubling. Notably, in the test set, 35 instances of the “Administrative_Areas” output exhibit an invalid JSON structure that deviates from the prompt-designed output structure used in the development set. Consequently, these outputs cannot be normalized during the evaluation process and are assigned a NULL penalty score of 1. This accounts for the increased error rate for this field in the test set compared to the development set.</p>
      <p id="d2e4959">For the impact categories, a major source of error arises from the model incorrectly capturing information from other levels. For instance, in the event “Cyclone Vayu” <xref ref-type="bibr" rid="bib1.bibx59" id="paren.57"/>, the article states that “Approximately 300 000 residents of coastal Gujarat were evacuated on 12 June in preparation for the system's arrival”. The model captures “Approximately 300 000” as the L1 total displaced information, which according to our definition of levels represents sub-national impact data and should therefore be recorded in L3. For similar reasons, in the test set, the model incurs NULL penalty scores for 46 entries in the “displaced” field, 33 entries in injuries, 39 in homeless, 47 in affected, 43 in buildings damaged, and 19 in total insured damage. This highlights that a large part of the L1 error rate for impact fields arises from impact information being correctly captured but assigned to the wrong spatial level.</p>
</sec>
<sec id="Ch1.S6.SS1.SSS2">
  <label>6.1.2</label><title>L2 (National Level) and L3 (Sub-national Level) Information Extraction</title>
      <p id="d2e4973">The model performance for L2 and L3 is generally worse than that for L1 (Sect. <xref ref-type="sec" rid="Ch1.S4.SS3"/>). During the matching process, an empty entry is added to the LLM output if the model fails to capture information recorded in the gold standard data. Similarly, if the model captures information absent in the gold standard data, an empty entry is created in the gold standard data. Both cases result in the highest possible error rate – a NULL penalty score of “1”.</p>
      <p id="d2e4978">To investigate this further, we analyse the number of entries in L2 and L3 for both the gold standard data and the LLM output (Table <xref ref-type="table" rid="T9"/>). We find that the LLM output contains more information on average than the gold standard data, which can be attributed to a variety of reasons. First, we observe a similar error type to that seen in L1 information extraction: the model sometimes assigns sub-national information to L2 instead of L3. A similar issue occurs in L3, where the model occasionally assigns country names to sub-national locations. Second, the model does not always adhere to the defined impact categories. For example, it may capture “about 600 houses without electricity” in the “Affected” field, which does not align with our definition that requires explicit mentions of keywords (see Table <xref ref-type="table" rid="T5"/>). We recognise that, in some cases, this may highlight shortcomings of our keyword list rather than erroneous information extraction by the model.</p>
      <p id="d2e4985">Finally, we examine the location-related fields, which have the highest error rates among all fields in each impact category. The model often outputs “NULL” in the “Num” impact field when location data is present, yet impact data is absent. This results in 2188 “NULL” values present among 5413 L2 and L3 output entries. For these entries, the model incurs a NULL penalty score for the location-related field, leading to a higher error rate.</p>

<table-wrap id="T9"><label>Table 9</label><caption><p id="d2e4992">Comparison of the average number of entries at the L2 and L3 levels for the Large Language Model (LLM) output and the gold standard data (Gold).</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="center"/>
     <oasis:colspec colnum="3" colname="col3" align="center" colsep="1"/>
     <oasis:colspec colnum="4" colname="col4" align="center"/>
     <oasis:colspec colnum="5" colname="col5" align="center"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry rowsep="1" namest="col2" nameend="col3" colsep="1">L2 </oasis:entry>
         <oasis:entry rowsep="1" namest="col4" nameend="col5">L3 </oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">LLM</oasis:entry>
         <oasis:entry colname="col3">Gold</oasis:entry>
         <oasis:entry colname="col4">LLM</oasis:entry>
         <oasis:entry colname="col5">Gold</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Deaths</oasis:entry>
         <oasis:entry colname="col2">1.60</oasis:entry>
         <oasis:entry colname="col3">0.89</oasis:entry>
         <oasis:entry colname="col4">2.88</oasis:entry>
         <oasis:entry colname="col5">2.16</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Injuries</oasis:entry>
         <oasis:entry colname="col2">1.47</oasis:entry>
         <oasis:entry colname="col3">0.22</oasis:entry>
         <oasis:entry colname="col4">1.96</oasis:entry>
         <oasis:entry colname="col5">0.48</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Homeless</oasis:entry>
         <oasis:entry colname="col2">1.50</oasis:entry>
         <oasis:entry colname="col3">0.08</oasis:entry>
         <oasis:entry colname="col4">2.35</oasis:entry>
         <oasis:entry colname="col5">0.09</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Displaced</oasis:entry>
         <oasis:entry colname="col2">1.62</oasis:entry>
         <oasis:entry colname="col3">0.19</oasis:entry>
         <oasis:entry colname="col4">2.28</oasis:entry>
         <oasis:entry colname="col5">0.58</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Affected</oasis:entry>
         <oasis:entry colname="col2">1.96</oasis:entry>
         <oasis:entry colname="col3">0.14</oasis:entry>
         <oasis:entry colname="col4">4.21</oasis:entry>
         <oasis:entry colname="col5">0.12</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Buildings Damaged</oasis:entry>
         <oasis:entry colname="col2">1.89</oasis:entry>
         <oasis:entry colname="col3">0.38</oasis:entry>
         <oasis:entry colname="col4">3.12</oasis:entry>
         <oasis:entry colname="col5">1.22</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Insured Damage</oasis:entry>
         <oasis:entry colname="col2">1.42</oasis:entry>
         <oasis:entry colname="col3">0.03</oasis:entry>
         <oasis:entry colname="col4">2.09</oasis:entry>
         <oasis:entry colname="col5">0.03</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Damage</oasis:entry>
         <oasis:entry colname="col2">1.56</oasis:entry>
         <oasis:entry colname="col3">0.51</oasis:entry>
         <oasis:entry colname="col4">2.85</oasis:entry>
         <oasis:entry colname="col5">0.78</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

</sec>
<sec id="Ch1.S6.SS1.SSS3">
  <label>6.1.3</label><title>Quality Improvement with Consolidation</title>
      <p id="d2e5198">Overall, the model's capability to capture and classify impact information varies across levels and entry categories. We address this challenge by automatically filtering main event types (e.g., geomagnetic storm) and hazards (e.g., landslide) not matching our predefined categories and by completing missing information through aggregation from L3 to L2 and from L2 to L1 (Sects. <xref ref-type="sec" rid="Ch1.S3.SS4"/> and S8). Here, we use the Typhoon Kate (1970) event <xref ref-type="bibr" rid="bib1.bibx60" id="paren.58"/> in the evaluation-score computation to illustrate how the consolidation process can improve database quality. For this event, there are 631 recorded fatalities in total; this is the only information available in the annotated data. However, the LLM also extracts 631 deaths in the Philippines at L2 and 631 deaths in southern Mindanao, Philippines, at L3. Under our evaluation protocol, these additional details are assigned NULL penalties, although correct, because they were missed by the annotators and are not present in the ground-truth annotations. In the consolidation process, the L2 and L3 information is recognized as consistent with L1, so these more detailed records are preserved in the database. The consolidation does not address issues such as misclassification of impact categories. Nonetheless, thanks to the consolidation steps many of the issues detailed in Sects. <xref ref-type="sec" rid="Ch1.S6.SS1.SSS1"/> and <xref ref-type="sec" rid="Ch1.S6.SS1.SSS2"/> are resolved in the final version of the database.</p>
</sec>
</sec>
<sec id="Ch1.S6.SS2">
  <label>6.2</label><title>Comparison with Existing Impact Databases</title>
      <p id="d2e5219">We endeavoured to conduct a fair comparison between EM-DAT and Wikimpacts, even though the databases differ in structure and in the categorisation of main events. EM-DAT has some level of standardization, using ISO/UN regions, and refers to GAUL administrative units. The weakness of EM-DAT is that the impact is not disaggregated between identified sub-national units. Our database generally contains more detailed information than EM-DAT, such as standardised impact data at a sub-national level, despite having fewer impact data entries than EM-DAT in many countries. The two databases further display very different distributions of the impact information across the different event categories. The total number of impact data entries between the two databases is nonetheless comparable, as are their biases in geographical coverage. When assessing the impact values, matching records can be noted for death and injury information, although significant discrepancies are observed in the data for homelessness and damage.</p>
      <p id="d2e5222">Notably, the substantial differences in both event coverage and impacts for matched events between Wikimpacts and EM-DAT do not necessarily arise from extraction errors in our pipeline. They may also issue from divergent event definitions, inclusion thresholds and criteria for impact data, differences in impact sources, and differences in the definitions and components of impact categories. Moreover, in this study we did not conduct a systematic comparison with other existing databases, such as DesInventar, but previous work shows large discrepancies between DesInventar and EM-DAT <xref ref-type="bibr" rid="bib1.bibx70 bib1.bibx36" id="paren.59"/>. We therefore recommend using our database as a complementary resource to existing databases. Furthermore, when matching events across different databases, we suggest testing different matching algorithms, for example based on event names and by allowing temporal buffers in event dates, in order to more reliably identify corresponding events across databases.</p>
      <p id="d2e5228">We next return to the broader challenges that we outlined in the introduction related to the currently available impact data for climate-related hazards. We argue that Wikimpacts 1.0 presents clear advances in several of those respects. First, it addresses the issue of non-standardised geographical information by including event-level and national-level impact data, and standardised information for sub-national impact data. This also prevents the issue of the same large-scale main event, e.g. a heatwave, being included in the database as several distinct events if it affected different countries. Second, Wikimpacts 1.0 is readily expandable thanks to its highly automated pipeline. Third, data in Wikimpacts 1.0 is traceable, as our database includes a Sources field for each impact entry. We also assign a range to our quantitative data when exact information is not provided in the underlying data source, enabling uncertainty-aware impact analyses. Finally, the database is fully reproducible (as long as the proprietary LLM models used remain available for use), since we openly share both the database itself and the source code of our processing pipeline.</p>
</sec>
<sec id="Ch1.S6.SS3">
  <label>6.3</label><title>Limitations</title>
      <p id="d2e5239">While Wikimpacts 1.0 innovates over existing databases in many aspects, it nonetheless comes with a number of caveats. First, the geographical coverage of the impact data remains uneven. We find that the exclusive use of English-language Wikipedia articles is likely not the main driver of this, as most of the reported events in other language editions of Wikipedia are also reported in English. While English-language bias does exists in our database, we thus do not view it as the primary source of overall geographical bias. We instead hypothesise that the reduced coverage in the Global South issues from less reporting of extreme events through Wikipedia, regardless of language. Related to this, for the events that are reported, there are many missing data for the different impact categories. Moreover, the pre-1900 records in Wikimpacts 1.0 database are limited, and future versions of Wikimpacts database will aim to include available historical events prior to 1900. Second, the coverage across main event categories is uneven, with comparatively few data entries for some categories like extreme temperatures and droughts. This may be partly due to the difficulty of assigning quantitative impacts to these events as their detrimental effects often occur on relatively long timescales and can be indirect. Moreover, certain hazards, such as landslides, are not included in our database. In addition, our pipeline, while scoring highly on the evaluation metrics, nonetheless introduces some errors relative to the original information provided by the Wikipedia articles we use. Systematic errors introduced by the LLM-based extraction, such as misclassification of L2 and L3 information, may lead to duplicate entries in the database. The extracted information is also sensitive to the specific LLM employed. The full Wikimpacts 1.0 database was generated using the state-of-the-art GPT-4o model available in 2024. The GPT family has continued to evolve since then; however, newer GPT versions are not evaluated in this work because we aim to fine-tune open source LLMs for the future live updates. Furthermore, we only provide information on the hazard causing the impacts at L1 level, while the database lacks L2 and L3 hazard information. The database focuses on direct impacts, and overlooks indirect or cascading impacts unless these fit into one of the predefined impact categories. Finally, the database's reliability is inherently tied to the quality of Wikipedia articles, as we perform no additional verification of the sources beyond what Wikipedia does. Nevertheless, the Wikimpacts 1.0 database is suitable for global impact-database benchmarking, exploratory sub-national impact assessment, and risk modeling in data-rich contexts (e.g., tropical storm/cylone events in the United States). However, it should be used with caution in applications that are sensitive to completeness or that focus on local or small-scale events. Further research could aim at addressing some of these limitations, for instance by expanding the database to multi-event Wikipedia articles, other Wikipedia languages or online textual sources beyond Wikipedia.</p>
</sec>
</sec>
<sec id="Ch1.S7" sec-type="conclusions">
  <label>7</label><title>Conclusion</title>
      <p id="d2e5251">The open access Wikimpacts 1.0 database encompasses 2726 climate events spanning the period 1034 to 2024, with global coverage. There is, however, a clear bias towards events in the Global North, specific event categories (notably tropical storms/cyclones) and more recent decades (from the 1950s onwards). We benchmark Wikimpacts 1.0 against the existing EM-DAT database, and find both agreements and notable differences. Wikimpacts 1.0 presents several innovations over the state of the art in multi-hazard global climate impact databases. The principal innovation is that, for each extreme event, the database provides hierarchical information on the impacts, enabling multi-scale impact analyses and climate risk and vulnerability assessments. The data is provided at three different spatial levels: aggregated over the whole event (L1; 2726 data entries), aggregated per affected country (L2; 17 912 data entries), and at the most highly spatially resolved information provided by the textual sources (L3; 32 343 data entries). The innovative automated pipeline ensures that the database is readily updateable and expandable with the inclusion of additional textual sources. Finally, each impact information is linked to the original source, ensuring verifiability of the information provided.</p>
</sec>

      
      </body>
    <back><notes notes-type="codeavailability"><title>Code availability</title>

      <p id="d2e5258">Code is available at <ext-link xlink:href="https://doi.org/10.5281/zenodo.19428787" ext-link-type="DOI">10.5281/zenodo.19428787</ext-link> <xref ref-type="bibr" rid="bib1.bibx26" id="paren.60"/>.</p>
  </notes><notes notes-type="dataavailability"><title>Data availability</title>

      <p id="d2e5271">The Wikimpacts 1.0 dataset comprises approximately 1.5 GB of data in SQLite database format and is publicly accessible via an open-access database server under the Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International (CC BY-NC-SA 4.0). A static version of the database as used in this paper is available at <ext-link xlink:href="https://doi.org/10.17043/li-2025-wikimpacts-1.0.final" ext-link-type="DOI">10.17043/li-2025-wikimpacts-1.0.final</ext-link> <xref ref-type="bibr" rid="bib1.bibx25" id="paren.61"/>. Furthermore, we direct readers to explore the various database releases at <uri>https://github.com/VUB-HYDR/Wikimpacts</uri> (last access: 20 May 2026, <xref ref-type="bibr" rid="bib1.bibx26" id="altparen.62"/>, <ext-link xlink:href="https://doi.org/10.5281/zenodo.19428787" ext-link-type="DOI">10.5281/zenodo.19428787</ext-link>), which include the raw outputs from the LLMs, as well as subsequent processing steps related to currency conversion and inflation adjustment. Lastly, we provide the <uri>https://www.wikimpacts.eu/</uri> (last access: 20 May 2026) for visualization and access for future updates of the database.</p>
  </notes><app-group>
        <supplementary-material position="anchor"><p id="d2e5293">The supplement related to this article is available online at <inline-supplementary-material xlink:href="https://doi.org/10.5194/nhess-26-2609-2026-supplement" xlink:title="pdf">https://doi.org/10.5194/nhess-26-2609-2026-supplement</inline-supplementary-material>.</p></supplementary-material>
        </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e5302">NL, WT, SZ, MMdB, SL, CF, JN and GM designed the analysis. NL conducted the LLM experiments, designed and plotted the figures and wrote the first draft of the manuscript under the supervision of WT. SZ wrote the database software pipeline with the support of NL and MK. KW and GM established the normalization rules for numeric information. KW supported part of their implementation in the software. JN and GM supervised the implementation of the software and database structure. KW, CF, and CT coordinated and implemented the manual data annotation. PM designed the website with the support of WT and NL. JZ provided guidance and contributed to discussions. All authors provided guidance on the analysis and contributed to writing the manuscript.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e5308">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e5315">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. The authors bear the ultimate responsibility for providing appropriate place names. Views expressed in the text are those of the authors and do not necessarily reflect the views of the publisher.</p>
  </notes><ack><title>Acknowledgements</title><p id="d2e5321">We thank Davide Faranda, Aglaé Jezequel and Olof Görnerup for the valuable discussions about this project. We thank the EM-DAT project team, and specifically Niko Speybroeck, Valentin Wathelet and Regina Below for guidance on our database consolidation process. We thank Johan Tengholm and Jacob Nelsone for their work on annotating textual data. Compute and storage resources and services used in this work were provided by the VSC (Flemish Supercomputer Center), funded by the Research Foundation – Flanders (FWO) and the Flemish Government, and by Research Institutes of Sweden AB. Ni Li is supported by the VUB Research Council in the framework of a EUTOPIA inter-university co-tutelle PhD between the Vrije Universiteit Brussel, Belgium, and TU Dresden, Germany. The EUTOPIA alliance is part of the European Universities Initiatives co-funded by the European Union. WT acknowledges funding from the European Research Council (ERC) under the European Union's Horizon Framework research and innovation programme (grant agreement no. 101124572; ERC Consolidator Grant “LACRIMA”), and further funding from the European Union under the grant agreement no. 101081369 (SPARCCLE). GM, JN and MK acknowledge funding from the Swedish Research Council Vetenskapsrådet (grant no. 2022-06599, climes). GM, JN, KW and SZ acknowledge funding from the Swedish Research Council Vetenskapsrådet (grant no. 2022-03448). GM, CF and KW acknowledge funding from the European Research Council (ERC) under the European Union's Horizon Framework research and innovation programme (grant agreement no. 101112727). Lastly, we thank OpenAI Researcher Access Program for allocating 5000$ API credits for the GPT application and text rephrasing support.</p></ack><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e5326">This research has been supported by the HORIZON EUROPE European Research Council (grant nos. 101124572 and 101112727) and the Vetenskapsrådet (grant nos. 2022-06599 and 2022-03448).</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e5332">This paper was edited by Christos Giannaros and reviewed by two anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bibx1"><label>Alencar et al.(2024)</label><mixed-citation>Alencar, P. H., Sodoge, J., Paton, E., and Madruga de Brito, M.: Flash droughts and their impacts–using newspaper articles to assess the perceived  consequences of rapidly emerging droughts, Environ. Res. Lett., 19, 074048, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/ad58fa" ext-link-type="DOI">10.1088/1748-9326/ad58fa</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx2"><label>Antweiler(2026)</label><mixed-citation>Antweiler, W.: PACIFIC Exchange Rate Service, University of British Columbia, Sauder School of Business, <uri>https://fx.sauder.ubc.ca</uri> (last access: 20 May 2026), 2026.</mixed-citation></ref>
      <ref id="bib1.bibx3"><label>Begum et al.(2022)</label><mixed-citation>Begum, R. A., Lempert, R., Ali, E., Benjaminsen, T. A., Bernauer, T., Cramer, W., Cui, X., Mach, K., Nagy, G., Stenseth, N. C., Sukumar, R., and Wester, P.: Point of Departure and Key Concepts, in: Climate Change 2022: Impacts, Adaptation and Vulnerability. Contribution of Working Group II to  the Sixth Assessment Report of the Intergovernmental Panel on Climate Change, edited by: Pörtner, H.-O., Roberts, D. C., Tignor, M., Poloczanska, E. S., Mintenbeck, K., Alegría, A., Craig, M., Langsdorf, S., Löschke, S., Möller, V., Okem, A., and Rama, B., Cambridge University Press, Cambridge, UK and New York, NY, USA, 121–196,  <ext-link xlink:href="https://doi.org/10.1017/9781009325844.003" ext-link-type="DOI">10.1017/9781009325844.003</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx4"><label>Burton et al.(2024)</label><mixed-citation>Burton, C., Lampe, S., Kelley, D. I., Thiery, W., Hantson, S., Christidis, N., Gudmundsson, L., Forrest, M., Burke, E., Chang, J., Huang, H., Ito, A.,  Kou-Giesbrecht, S., Lasslop, G., Li, W., Nieradzik, L., Li, F., Chen, Y.,  Randerson, J., Reyer, C. P. O., and Mengel, M.: Global burned area  increasingly explained by climate change, Nat. Clim. Change, 14, 1186–1192, <ext-link xlink:href="https://doi.org/10.1038/s41558-024-02140-w" ext-link-type="DOI">10.1038/s41558-024-02140-w</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx5"><label>DateParser contributors(2024)</label><mixed-citation>DateParser contributors: Dateparser – python parser for human readable  dates, GitHub Repository, <uri>https://github.com/scrapinghub/dateparser/tree/master</uri> (last access: 20 May 2026), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx6"><label>de Brito et al.(2020)</label><mixed-citation>de Brito, M. M., Kuhlicke, C., and Marx, A.: Near-real-time drought impact assessment: a text mining approach on the 2018/19 drought in Germany,  Environ. Res. Lett., 15, 1040a9, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/aba4ca" ext-link-type="DOI">10.1088/1748-9326/aba4ca</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx7"><label>de Brito et al.(2024)</label><mixed-citation>de Brito, M. M., Sodoge, J., Fekete, A., Hagenlocher, M., Koks, E., Kuhlicke,  C., Messori, G., de Ruiter, M., Schweizer, P.-J., and Ward, P. J.: Uncovering  the Dynamics of Multi-Sector Impacts of Hydrological Extremes: A Methods  Overview, Earth's Future, 12, e2023EF003906, <ext-link xlink:href="https://doi.org/10.1029/2023EF003906" ext-link-type="DOI">10.1029/2023EF003906</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx8"><label>de Brito et al.(2025)</label><mixed-citation>de Brito, M. M., Sodoge, J., Kreibich, H., and Kuhlicke, C.: Comprehensive assessment of flood socioeconomic impacts through text-mining, Water Resour. Res., 61, e2024WR037813, <ext-link xlink:href="https://doi.org/10.1029/2024WR037813" ext-link-type="DOI">10.1029/2024WR037813</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx9"><label>de Bruijn et al.(2019)</label><mixed-citation>de Bruijn, J. A., de Moel, H., Jongman, B., de Ruiter, M. C., Wagemaker, J.,  and Aerts, J. C.: A global database of historic and real-time flood events  based on social media, Scientific data, 6, 311, <ext-link xlink:href="https://doi.org/10.1038/s41597-019-0326-9" ext-link-type="DOI">10.1038/s41597-019-0326-9</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx10"><label>Delforge et al.(2025)</label><mixed-citation>Delforge, D., Wathelet, V., Below, R., Sofia, C. L., Tonnelier, M., van  Loenhout, J. A., and Speybroeck, N.: EM-DAT: the Emergency Events Database,  Int. J. Disast. Risk Re., 124, 105509, <ext-link xlink:href="https://doi.org/10.1016/j.ijdrr.2025.105509" ext-link-type="DOI">10.1016/j.ijdrr.2025.105509</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx11"><label>d'Errico et al.(2022)</label><mixed-citation>D'Errico, M., Pons, F., Yiou, P., Tao, S., Nardini, C., Lunkeit, F., and Faranda, D.: Present and future synoptic circulation patterns associated with cold and snowy spells over Italy, Earth Syst. Dynam., 13, 961–992, <ext-link xlink:href="https://doi.org/10.5194/esd-13-961-2022" ext-link-type="DOI">10.5194/esd-13-961-2022</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx12"><label>Devlin et al.(2019)</label><mixed-citation>Devlin, J., Chang, M.-W., Lee, K., and Toutanova, K.: BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding, in: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), Association for Computational Linguistics, 4171–4186, <ext-link xlink:href="https://doi.org/10.18653/v1/N19-1423" ext-link-type="DOI">10.18653/v1/N19-1423</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx13"><label>Eberenz et al.(2021)</label><mixed-citation>Eberenz, S., Lüthi, S., and Bresch, D. N.: Regional tropical cyclone impact functions for globally consistent risk assessments, Nat. Hazards Earth Syst. Sci., 21, 393–415, <ext-link xlink:href="https://doi.org/10.5194/nhess-21-393-2021" ext-link-type="DOI">10.5194/nhess-21-393-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx14"><label>Faiella et al.(2020)</label><mixed-citation>Faiella, A., Antofie, T., Luoni, S., Marin Ferrer, M., and Rios Diaz, F.: The  Risk Data Hub loss datasets, Tech. Rep. EUR 30036 EN, Publications Office of  the European Union, Luxembourg, <ext-link xlink:href="https://doi.org/10.2760/488300" ext-link-type="DOI">10.2760/488300</ext-link>, ISBN 978-92-76-14656-8, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx15"><label>Flynn et al.(2025)</label><mixed-citation>Flynn, C. M., Moemken, J., Pinto, J. G., Schutte, M. K., and Messori, G.: CLIMK–WINDS: a new database of extreme European winter windstorms, Earth Syst. Sci. Data, 17, 4431–4453, <ext-link xlink:href="https://doi.org/10.5194/essd-17-4431-2025" ext-link-type="DOI">10.5194/essd-17-4431-2025</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx16"><label>Global Administrative Areas(2012)</label><mixed-citation>Global Administrative Areas: GADM database of Global Administrative Areas, version 2.0, <uri>https://gadm.org/</uri> (last access: 20 May 2026), 2012.</mixed-citation></ref>
      <ref id="bib1.bibx17"><label>Hammond et al.(2015)</label><mixed-citation> Hammond, M. J., Chen, A. S., Djordjević, S., Butler, D., and Mark, O.:  Urban flood impact assessment: A state-of-the-art review, Urban Water J., 12, 14–29, 2015.</mixed-citation></ref>
      <ref id="bib1.bibx18"><label>Harrington and Otto(2020)</label><mixed-citation>Harrington, L. J. and Otto, F. E.: Reconciling theory with the reality of  African heatwaves, Nat. Clim. Change, 10, 796–798, <ext-link xlink:href="https://doi.org/10.1038/s41558-020-0851-8" ext-link-type="DOI">10.1038/s41558-020-0851-8</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx19"><label>Hurlbert et al.(2019)</label><mixed-citation>Hurlbert, M., Krishnaswamy, J., Johnson, F. X., Rodríguez-Morales, J. E., and Zommers, Z.: 7 – Risk management and decision making in relation to  sustainable development, in: Climate Change and Land: An IPCC Special Report on Climate Change, Desertification, Land Degradation, Sustainable Land Management, Food Security, and Greenhouse Gas Fluxes in Terrestrial Ecosystems, edited by: Shukla, P. R., Skea, J., Calvo Buendia, E.,  Masson-Delmotte, V., Pörtner, H.-O., Roberts, D. C., Zhai, P., Slade, R.,  Connors, S., van Diemen, R., Ferrat, M., Haughey, E., Luz, S., Neogi, S.,  Pathak, M., Petzold, J., Portugal Pereira, J., Vyas, P., Huntley, E.,  Kissick, K., Belkacemi, M., and Malley, J., Cambridge University Press, Cambridge, 673–800, <ext-link xlink:href="https://doi.org/10.1017/9781009157988.009" ext-link-type="DOI">10.1017/9781009157988.009</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx20"><label>Jones et al.(2022)</label><mixed-citation>Jones, M. W., Abatzoglou, J. T., Veraverbeke, S., Andela, N., Lasslop, G.,  Forkel, M., Smith, A. J. P., Burton, C., Betts, R. A., van der Werf, G. R.,  Sitch, S., Canadell, J. G., Santín, C., Kolden, C., Doerr, S. H., and  Le Quéré, C.: Global and Regional Trends and Drivers of Fire Under Climate  Change, Rev. Geophys., 60, e2020RG000726, <ext-link xlink:href="https://doi.org/10.1029/2020RG000726" ext-link-type="DOI">10.1029/2020RG000726</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx21"><label>Kreibich et al.(2023)</label><mixed-citation>Kreibich, H., Schröter, K., Di Baldassarre, G., Van Loon, A. F., Mazzoleni, M., Abeshu, G. W., Agafonova, S., AghaKouchak, A., Aksoy, H., Alvarez-Garreton, C., Aznar, B., Balkhi, L., Barendrecht, M. H., Biancamaria, S., Bos-Burgering, L., Bradley, C., Budiyono, Y., Buytaert, W., Capewell, L., Carlson, H., Cavus, Y., Couasnon, A., Coxon, G., Daliakopoulos, I., de Ruiter, M. C., Delus, C., Erfurt, M., Esposito, G., François, D., Frappart, F., Freer, J., Frolova, N., Gain, A. K., Grillakis, M., Grima, J. O., Guzmán, D. A., Huning, L. S., Ionita, M., Kharlamov, M., Khoi, D. N., Kieboom, N., Kireeva, M., Koutroulis, A., Lavado-Casimiro, W., Li, H.-Y., LLasat, M. C., Macdonald, D., Mård, J., Mathew-Richards, H., McKenzie, A., Mejia, A., Mendiondo, E. M., Mens, M., Mobini, S., Mohor, G. S., Nagavciuc, V., Ngo-Duc, T., Nguyen, H. T. T., Nhi, P. T. T., Petrucci, O., Quan, N. H., Quintana-Seguí, P., Razavi, S., Ridolfi, E., Riegel, J., Sadik, M. S., Sairam, N., Savelli, E., Sazonov, A., Sharma, S., Sörensen, J., Souza, F. A. A., Stahl, K., Steinhausen, M., Stoelzle, M., Szalińska, W., Tang, Q., Tian, F., Tokarczyk, T., Tovar, C., Tran, T. V. T., van Huijgevoort, M. H. J., van Vliet, M. T. H., Vorogushyn, S., Wagener, T., Wang, Y., Wendt, D. E., Wickham, E., Yang, L., Zambrano-Bigiarini, M., and Ward, P. J.: Panta Rhei benchmark dataset: socio-hydrological data of paired events of floods and droughts, Earth Syst. Sci. Data, 15, 2009–2023, <ext-link xlink:href="https://doi.org/10.5194/essd-15-2009-2023" ext-link-type="DOI">10.5194/essd-15-2009-2023</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx22"><label>Lange et al.(2020)</label><mixed-citation>Lange, S., Volkholz, J., Geiger, T., Zhao, F., Vega, I., Veldkamp, T., Reyer,  C., Warszawski, L., Huber, V., Jägermeyr, J., Schewe, J., Bresch, D.,  Büchner, M., Chang, J., Ciais, P., Dury, M., Emanuel, K., Folberth, C.,  Gerten, D., and Frieler, K.: Projecting Exposure to Extreme Climate Impact  Events Across Six Event Categories and Three Spatial Scales, Earth's Future,  11, e2020EF001616, <ext-link xlink:href="https://doi.org/10.1029/2020EF001616" ext-link-type="DOI">10.1029/2020EF001616</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx23"><label>Lee et al.(2024)</label><mixed-citation>Lee, R., White, C. J., Adnan, M. S. G., Douglas, J., Mahecha, M. D.,  O'Loughlin, F. E., Patelli, E., Ramos, A. M., Roberts, M. J., Martius, O.,  Tubaldi, E., van den Hurk, B., Ward, P. J., and Zscheischler, J.:  Reclassifying historical disasters: From single to multi-hazards, Sci. Total Environ., 912, 169120, <ext-link xlink:href="https://doi.org/10.1016/j.scitotenv.2023.169120" ext-link-type="DOI">10.1016/j.scitotenv.2023.169120</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx24"><label>Li et al.(2024)</label><mixed-citation>Li, N., Zahra, S., de Brito, M. M., Flynn, C. M., Görnerup, O., Koffi, W., Kurfali, M., Meng, C., Thiery, W., Zscheischler, J., Messori, G., and Nivre, J.: Using LLMs to Build a Database of Climate Extreme Impacts, in: Natural Language Processing meets Climate Change @ ACL 2024,  <uri>https://openreview.net/forum?id=h7o0qyQ0rt</uri> (last access:20 May 2026), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx25"><label>Li et al.(2026a)</label><mixed-citation>Li, N., Thiery, W., Zahra, S., de Brito, M. M., Worou, K., Kurfali, M., Lampe, S., Munoz, P., Flynn, C., Trigoso, C., Nivre, J., Zscheischler, J., and Messori, G.: Wikimpacts – A global climate impact database based on  automated information extraction from Wikipedia, Version 1.0.final, Bolin Centre Database [data set],  <ext-link xlink:href="https://doi.org/10.17043/li-2025-wikimpacts-1.0.final" ext-link-type="DOI">10.17043/li-2025-wikimpacts-1.0.final</ext-link>, 2026a.</mixed-citation></ref>
      <ref id="bib1.bibx26"><label>Li et al.(2026b)</label><mixed-citation>Li, N., Zahra, S., Worou, K., Kurfali, M., Görnerup, O., Nivre, J., and  Messori, G.: VUB-HYDR/Wikimpacts: Wikimpacts v1.0.final, Version v1.0.final, Zenodo [code/data set], <ext-link xlink:href="https://doi.org/10.5281/zenodo.19428787" ext-link-type="DOI">10.5281/zenodo.19428787</ext-link>, 2026b.</mixed-citation></ref>
      <ref id="bib1.bibx27"><label>Lindersson and Messori(2025)</label><mixed-citation>Lindersson, S. and Messori, G.: SHEDIS-Temperature: linking temperature-related disaster impacts to subnational data on meteorology and human exposure, Earth Syst. Sci. Data, 17, 6379–6403, <ext-link xlink:href="https://doi.org/10.5194/essd-17-6379-2025" ext-link-type="DOI">10.5194/essd-17-6379-2025</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx28"><label>Lüthi et al.(2021)</label><mixed-citation>Lüthi, S., Aznar-Siguan, G., Fairless, C., and Bresch, D. N.: Globally consistent assessment of economic impacts of wildfires in CLIMADA v2.2, Geosci. Model Dev., 14, 7175–7187, <ext-link xlink:href="https://doi.org/10.5194/gmd-14-7175-2021" ext-link-type="DOI">10.5194/gmd-14-7175-2021</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx29"><label>Mithal et al.(2024)</label><mixed-citation>Mithal, V., Sillmann, J., and Zscheischler, J.: Linking regional economic  impacts of temperature-related disasters to underlying climatic hazards,  Environ. Res. Lett., 19, 124010, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/ad89de" ext-link-type="DOI">10.1088/1748-9326/ad89de</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx30"><label>Moemken et al.(2024)</label><mixed-citation>Moemken, J., Messori, G., and Pinto, J. G.: Windstorm losses in Europe–What to gain from damage datasets, Weather and Climate Extremes, 44, 100661, <ext-link xlink:href="https://doi.org/10.1016/j.wace.2024.100661" ext-link-type="DOI">10.1016/j.wace.2024.100661</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx31"><label>Mora et al.(2017)</label><mixed-citation>Mora, C., Dousset, B., Caldwell, I. R., Powell, F. E., Geronimo, R. C., Bielecki, C. R., Counsell, C. W. W., Dietrich, B. S., Johnston, E. T., Louis, L. V., Lucas, M. P., McKenzie, M. M., Shea, A. G., Tseng, H., Giambelluca, T. W., Leon, Lisa R., Hawkins, E., and Trauernicht, C.: Global risk of deadly heat, Nat. Clim. Change, 7, 501–506, <ext-link xlink:href="https://doi.org/10.1038/nclimate3322" ext-link-type="DOI">10.1038/nclimate3322</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx32"><label>Muheki et al.(2024)</label><mixed-citation>Muheki, D., Deijns, A. A. J., Bevacqua, E., Messori, G., Zscheischler, J., and Thiery, W.: The perfect storm? Co-occurring climate extremes in East Africa, Earth Syst. Dynam., 15, 429–466, <ext-link xlink:href="https://doi.org/10.5194/esd-15-429-2024" ext-link-type="DOI">10.5194/esd-15-429-2024</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx33"><label>OpenAI(2024)</label><mixed-citation>OpenAI: Gpt-4o system card,   <uri>https://cdn.openai.com/gpt-4o-system-card.pdf</uri> (last access: 20 May 2026), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx34"><label>OpenStreetMap contributors(2017a)</label><mixed-citation>OpenStreetMap contributors: Planet dump,  <uri>https://www.openstreetmap.org</uri> (last access: 20 May 2026), 2017a.</mixed-citation></ref>
      <ref id="bib1.bibx35"><label>OpenStreetMap contributors(2017b)</label><mixed-citation>OpenStreetMap contributors: TMC/Location Code List/Location Types,  <uri>https://wiki.openstreetmap.org/wiki/TMC/Location_Code_List/Location_Types</uri> (last access: 20 May 2026),  2017b.</mixed-citation></ref>
      <ref id="bib1.bibx36"><label>Panwar and Sen(2019)</label><mixed-citation> Panwar, V. and Sen, S.: Economic impact of natural disasters: An empirical  re-examination, Margin: The Journal of Applied Economic Research, 13,  109–139, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx37"><label>Panwar and Sen(2020)</label><mixed-citation> Panwar, V. and Sen, S.: Disaster damage records of EM-DAT and DesInventar: a  systematic comparison, Economics of Disasters and Climate Change, 4,  295–317, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx38"><label>Papagiannaki et al.(2022)</label><mixed-citation>Papagiannaki, K., Petrucci, O., Diakakis, M., Kotroni, V., Aceto, L., Bianchi, C., Brázdil, R., Gelabert, M. G., Inbar, M., Kahraman, A., Özgenur   Kılıç, Krahn, A., Kreibich, H., Llasat, M. C., Llasat-Botija, M.,   Macdonald, N., de Brito, M. M., Mercuri, M., Pereira, S., Řehoř, J., Geli,   J. R., Salvati, P., Vinet, F., and Zêzere, J. L.: Developing a large-scale   dataset of flood fatalities for territories in the Euro-Mediterranean region,   FFEM-DB, Scientific Data, 9, 166, <ext-link xlink:href="https://doi.org/10.1038/s41597-022-01273-x" ext-link-type="DOI">10.1038/s41597-022-01273-x</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bibx39"><label>Paprotny et al.(2024)</label><mixed-citation>Paprotny, D., Terefenko, P., and Śledziowski, J.: HANZE v2.1: an improved database of flood impacts in Europe from 1870 to 2020, Earth Syst. Sci. Data, 16, 5145–5170, <ext-link xlink:href="https://doi.org/10.5194/essd-16-5145-2024" ext-link-type="DOI">10.5194/essd-16-5145-2024</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx40"><label>Rosvold and Buhaug(2021)</label><mixed-citation>Rosvold, E. L. and Buhaug, H.: GDIS, a global dataset of geocoded disaster  locations, Scientific data, 8, 61, <ext-link xlink:href="https://doi.org/10.1038/s41597-021-00846-6" ext-link-type="DOI">10.1038/s41597-021-00846-6</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx41"><label>Sanh et al.(2019)</label><mixed-citation>Sanh, V., Debut, L., Chaumond, J., and Wolf, T.: DistilBERT, a distilled  version of BERT: smaller, faster, cheaper and lighter, arXiv [preprint], <ext-link xlink:href="https://doi.org/10.48550/arXiv.1910.01108" ext-link-type="DOI">10.48550/arXiv.1910.01108</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bibx42"><label>Seneviratne et al.(2021)</label><mixed-citation>Seneviratne, S., Zhang, X., Adnan, M., Badi, W., Dereczynski, C., Di Luca, A., Ghosh, S., Iskandar, I., Kossin, J., Lewis, S., Otto, F., Pinto, I., Satoh, M., Vicente-Serrano, S., Wehner, M., and Zhou, B.: Weather and Climate  Extreme Events in a Changing Climate, Cambridge University Press, Cambridge, United Kingdom and New York, NY, USA, 1513–1766,   <ext-link xlink:href="https://doi.org/10.1017/9781009157896.013" ext-link-type="DOI">10.1017/9781009157896.013</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx43"><label>Sodoge et al.(2023)</label><mixed-citation>Sodoge, J., Kuhlicke, C., and de Brito, M. M.: Automatized spatio-temporal  detection of drought impacts from newspaper articles using natural language  processing and machine learning, Weather and Climate Extremes, 41, 100574, <ext-link xlink:href="https://doi.org/10.1016/j.wace.2023.100574" ext-link-type="DOI">10.1016/j.wace.2023.100574</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bibx44"><label>Stahl et al.(2016)</label><mixed-citation>Stahl, K., Kohn, I., Blauhut, V., Urquijo, J., De Stefano, L., Acácio, V., Dias, S., Stagge, J. H., Tallaksen, L. M., Kampragou, E., Van Loon, A. F., Barker, L. J., Melsen, L. A., Bifulco, C., Musolino, D., de Carli, A., Massarutto, A., Assimacopoulos, D., and Van Lanen, H. A. J.: Impacts of European drought events: insights from an international database of text-based reports, Nat. Hazards Earth Syst. Sci., 16, 801–819, <ext-link xlink:href="https://doi.org/10.5194/nhess-16-801-2016" ext-link-type="DOI">10.5194/nhess-16-801-2016</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bibx45"><label>Teber et al.(2025)</label><mixed-citation>Teber, K., Weynants, M., Gans, F., and Mahecha, M. D.: Geo-Disasters: Geocoding climate-related events in the international disaster database EM-DAT, Big Earth Data, 10, 303–318, <ext-link xlink:href="https://doi.org/10.1080/20964471.2025.2576274" ext-link-type="DOI">10.1080/20964471.2025.2576274</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx46"><label>Thiery et al.(2017)</label><mixed-citation>Thiery, W., Gudmundsson, L., Bedka, K., Semazzi, F. H., Lhermitte, S., Willems, P., van Lipzig, N. P., and Seneviratne, S. I.: Early warnings of hazardous thunderstorms over Lake Victoria, Environ. Res. Lett., 12, 074012, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/aa7521" ext-link-type="DOI">10.1088/1748-9326/aa7521</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bibx47"><label>Thiery et al.(2021)</label><mixed-citation>Thiery, W., Lange, S., Rogelj, J., Schleussner, C.-F., Gudmundsson, L.,  Seneviratne, S. I., Andrijevic, M., Frieler, K., Emanuel, K., Geiger, T.,  Bresch, D. N., Zhao, F., Willner, S. N., Büchner, M., Volkholz, J., Bauer,  N., Chang, J., Ciais, P., Dury, M., François, L., Grillakis, M., Gosling,  S. N., Hanasaki, N., Hickler, T., Huber, V., Ito, A., Jägermeyr, J.,  Khabarov, N., Koutroulis, A., Liu, W., Lutz, W., Mengel, M., Müller, C.,  Ostberg, S., Reyer, C. P. O., Stacke, T., and Wada, Y.: Intergenerational  inequities in exposure to climate extremes, Science, 374, 158–160,  <ext-link xlink:href="https://doi.org/10.1126/science.abi7339" ext-link-type="DOI">10.1126/science.abi7339</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bibx48"><label>Tonmoy et al.(2024)</label><mixed-citation>Tonmoy, S. M. T. I., Zaman, S. M. M., Jain, V., Rani, A., Rawte, V., Chadha,  A., and Das, A.: A Comprehensive Survey of Hallucination Mitigation  Techniques in Large Language Models, arXiv [preprint],  <ext-link xlink:href="https://doi.org/10.48550/arXiv.2401.01313" ext-link-type="DOI">10.48550/arXiv.2401.01313</ext-link>, 2024.</mixed-citation></ref>
      <ref id="bib1.bibx49"><label>Tschumi and Zscheischler(2020)</label><mixed-citation> Tschumi, E. and Zscheischler, J.: Countrywide climate features during recorded climate-related disasters, Climatic Change, 158, 593–609, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx50"><label>UNISDR(2024)</label><mixed-citation>UNISDR: DesInventar: United Nations Office for Disaster Risk Reduction,  <uri>https://www.desinventar.net/</uri> (last access: May 2024), 2024.</mixed-citation></ref>
      <ref id="bib1.bibx51"><label>Wikipedia contributors(2024a)</label><mixed-citation>Wikipedia contributors: 1939 Pacific hurricane season – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=1939_Pacific_hurricane_season&amp;oldid=1224891091</uri>, (last access: 26 January 2026), 2024a.</mixed-citation></ref>
      <ref id="bib1.bibx52"><label>Wikipedia contributors(2024b)</label><mixed-citation>Wikipedia contributors: Hurricane Nate (2005) – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Hurricane_Nate_(2005)&amp;oldid=1249615441</uri>, (last access: 30 January 2026), 2024b.</mixed-citation></ref>
      <ref id="bib1.bibx53"><label>Wikipedia contributors(2025a)</label><mixed-citation>Wikipedia contributors: 2015 Russian wildfires – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=2015_Russian_wildfires&amp;oldid=1293003396</uri>, (last access: 26 January 2026), 2025a.</mixed-citation></ref>
      <ref id="bib1.bibx54"><label>Wikipedia contributors(2025b)</label><mixed-citation>Wikipedia contributors: 2017 Tulsa tornadoes – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=2017_Tulsa_tornadoes&amp;oldid=1296198946</uri>, (last access: 26 January 2026), 2025b.</mixed-citation></ref>
      <ref id="bib1.bibx55"><label>Wikipedia contributors(2025c)</label><mixed-citation>Wikipedia contributors: 1999 Blayais Nuclear Power Plant flood – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=1999_Blayais_Nuclear_Power_Plant_flood&amp;oldid=1309899681</uri>, (last access: 26 January 2026), 2025c.</mixed-citation></ref>
      <ref id="bib1.bibx56"><label>Wikipedia contributors(2025d)</label><mixed-citation>Wikipedia contributors: 2011 European floods – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=2011_European_floods&amp;oldid=1310685507</uri>, (last access: 26 January 2026), 2025d.</mixed-citation></ref>
      <ref id="bib1.bibx57"><label>Wikipedia contributors(2025e)</label><mixed-citation>Wikipedia contributors: Hurricane Larry – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Hurricane_Larry&amp;oldid=1315207889</uri>, (last access: 30 January 2026), 2025e.</mixed-citation></ref>
      <ref id="bib1.bibx58"><label>Wikipedia contributors(2025f)</label><mixed-citation>Wikipedia contributors: List of Nicaragua hurricanes – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=List_of_Nicaragua_hurricanes&amp;oldid=1319005054</uri>, (last access: 9 April 2026), 2025f.</mixed-citation></ref>
      <ref id="bib1.bibx59"><label>Wikipedia contributors(2025g)</label><mixed-citation>Wikipedia contributors: Cyclone Vayu – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Cyclone_Vayu&amp;oldid=1320664862</uri>, (last access: 30 January 2026), 2025g.</mixed-citation></ref>
      <ref id="bib1.bibx60"><label>Wikipedia contributors(2025h)</label><mixed-citation>Wikipedia contributors: Typhoon Kate – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Typhoon_Kate&amp;oldid=1321753937</uri>, (last access: 26 January 2026), 2025h.</mixed-citation></ref>
      <ref id="bib1.bibx61"><label>Wikipedia contributors(2025i)</label><mixed-citation>Wikipedia contributors: Typhoons in Taiwan – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Typhoons_in_Taiwan&amp;oldid=1322603935</uri>, (last access: 9 April 2026), 2025i.</mixed-citation></ref>
      <ref id="bib1.bibx62"><label>Wikipedia contributors(2025j)</label><mixed-citation>Wikipedia contributors: Tropical cyclones in 2013 – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Tropical_cyclones_in_2013&amp;oldid=1325283599</uri>, (last access: 26 January 2026), 2025j.</mixed-citation></ref>
      <ref id="bib1.bibx63"><label>Wikipedia contributors(2026a)</label><mixed-citation>Wikipedia contributors: 1983–1985 famine in Ethiopia – Wikipedia, The Free Encyclopedia, <uri>https://en.wikipedia.org/w/index.php?title=1983-1985_famine_in_Ethiopia&amp;oldid=1332375726</uri>, (last access: 30 January 2026), 2026a. </mixed-citation></ref>
      <ref id="bib1.bibx64"><label>Wikipedia contributors(2026b)</label><mixed-citation>Wikipedia contributors: 2021 European floods – Wikipedia, The Free   Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=2021_European_floods&amp;oldid=1333089008</uri>, (last access: 26 January 2026), 2026b.</mixed-citation></ref>
      <ref id="bib1.bibx65"><label>Wikipedia contributors(2026c)</label><mixed-citation>Wikipedia contributors: Hurricane Ida – Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Hurricane_Ida&amp;oldid=1333487396</uri>, (last access: 30 January 2026), 2026c.</mixed-citation></ref>
      <ref id="bib1.bibx66"><label>Wikipedia contributors(2026d)</label><mixed-citation>Wikipedia contributors: Miami Hurricanes football – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Miami_Hurricanes_football&amp;oldid=1334196783</uri>, (last access: 30 January 2026), 2026d.</mixed-citation></ref>
      <ref id="bib1.bibx67"><label>Wikipedia contributors(2026e)</label><mixed-citation>Wikipedia contributors: 2021 Atlantic hurricane season – Wikipedia, The  Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=2021_Atlantic_hurricane_season&amp;oldid=1335534205</uri>, (last access: 30 January 2026), 2026e.</mixed-citation></ref>
      <ref id="bib1.bibx68"><label>Wikipedia contributors(2026f)</label><mixed-citation>Wikipedia contributors: Typhoon Talim (2017) – Wikipedia, The Free  Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Typhoon_Talim_(2017)&amp;oldid=1336967505</uri>, (last access: 9 April 2026), 2026f.</mixed-citation></ref>
      <ref id="bib1.bibx69"><label>Wikipedia contributors(2026g)</label><mixed-citation>Wikipedia contributors: Lists of tornadoes and tornado outbreaks –   Wikipedia, The Free Encyclopedia,  <uri>https://en.wikipedia.org/w/index.php?title=Lists_of_tornadoes_and_tornado_outbreaks&amp;oldid=1343462266</uri>, (last access: 9 April 2026), 2026g.</mixed-citation></ref>
      <ref id="bib1.bibx70"><label>Worou and Messori(2025)</label><mixed-citation>Worou, K. and Messori, G.: Compounding droughts and floods amplify  socio-economic impacts, Environ. Res. Lett., 20, 104024, <ext-link xlink:href="https://doi.org/10.1088/1748-9326/adfe82" ext-link-type="DOI">10.1088/1748-9326/adfe82</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bibx71"><label>Zommers et al.(2020)</label><mixed-citation>Zommers, Z., Marbaix, P., Fischlin, A., Ibrahim, Z. Z., Grant, S., Magnan,  A. K., Pörtner, H.-O., Howden, M., Calvin, K., Warner, K., Thiery, W.,  Sebesvari, Z., Davin, E. L., Evans, J. P., Rosenzweig, C., O’Neill, B. C.,  Patwardhan, A., Warren, R., van Aalst, M. K., and Hulbert, M.: Burning  embers: towards more transparent and robust climate-change risk assessments,  Nature Reviews Earth &amp; Environment, 1, 516–529,  <ext-link xlink:href="https://doi.org/10.1038/s43017-020-0088-0" ext-link-type="DOI">10.1038/s43017-020-0088-0</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bibx72"><label>Zscheischler and Seneviratne(2017)</label><mixed-citation>Zscheischler, J. and Seneviratne, S. I.: Dependence of drivers affects risks  associated with compound events, Science Advances, 3, e1700263, <ext-link xlink:href="https://doi.org/10.1126/sciadv.1700263" ext-link-type="DOI">10.1126/sciadv.1700263</ext-link>, 2017.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>Wikimpacts 1.0: a new global climate impact database based on automated information extraction from Wikipedia</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>Alencar et al.(2024)</label><mixed-citation>
      
Alencar, P. H., Sodoge, J., Paton, E., and Madruga de Brito, M.: Flash droughts and their impacts–using newspaper articles to assess the perceived  consequences of rapidly emerging droughts, Environ. Res. Lett., 19, 074048,
<a href="https://doi.org/10.1088/1748-9326/ad58fa" target="_blank">https://doi.org/10.1088/1748-9326/ad58fa</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>Antweiler(2026)</label><mixed-citation>
      
Antweiler, W.: PACIFIC Exchange Rate Service, University of British Columbia,
Sauder School of Business, <a href="https://fx.sauder.ubc.ca" target="_blank"/> (last access: 20 May 2026), 2026.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>Begum et al.(2022)</label><mixed-citation>
      
Begum, R. A., Lempert, R., Ali, E., Benjaminsen, T. A., Bernauer, T., Cramer, W., Cui, X., Mach, K., Nagy, G., Stenseth, N. C., Sukumar, R., and Wester, P.: Point of Departure and Key Concepts, in: Climate Change 2022: Impacts, Adaptation and Vulnerability. Contribution of Working Group II to  the Sixth Assessment Report of the Intergovernmental Panel on Climate Change, edited by: Pörtner, H.-O., Roberts, D. C., Tignor, M., Poloczanska, E. S., Mintenbeck, K., Alegría, A., Craig, M., Langsdorf, S., Löschke, S., Möller, V., Okem, A., and Rama, B., Cambridge University Press, Cambridge, UK and New York, NY, USA, 121–196,  <a href="https://doi.org/10.1017/9781009325844.003" target="_blank">https://doi.org/10.1017/9781009325844.003</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>Burton et al.(2024)</label><mixed-citation>
      
Burton, C., Lampe, S., Kelley, D. I., Thiery, W., Hantson, S., Christidis, N., Gudmundsson, L., Forrest, M., Burke, E., Chang, J., Huang, H., Ito, A.,  Kou-Giesbrecht, S., Lasslop, G., Li, W., Nieradzik, L., Li, F., Chen, Y.,  Randerson, J., Reyer, C. P. O., and Mengel, M.: Global burned area  increasingly explained by climate change, Nat. Clim. Change, 14, 1186–1192, <a href="https://doi.org/10.1038/s41558-024-02140-w" target="_blank">https://doi.org/10.1038/s41558-024-02140-w</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>DateParser contributors(2024)</label><mixed-citation>
      
DateParser contributors: Dateparser – python parser for human readable  dates, GitHub Repository, <a href="https://github.com/scrapinghub/dateparser/tree/master" target="_blank"/> (last access: 20 May 2026), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>de Brito et al.(2020)</label><mixed-citation>
      
de Brito, M. M., Kuhlicke, C., and Marx, A.: Near-real-time drought impact assessment: a text mining approach on the 2018/19 drought in Germany,  Environ. Res. Lett., 15, 1040a9, <a href="https://doi.org/10.1088/1748-9326/aba4ca" target="_blank">https://doi.org/10.1088/1748-9326/aba4ca</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>de Brito et al.(2024)</label><mixed-citation>
      
de Brito, M. M., Sodoge, J., Fekete, A., Hagenlocher, M., Koks, E., Kuhlicke,  C., Messori, G., de Ruiter, M., Schweizer, P.-J., and Ward, P. J.: Uncovering  the Dynamics of Multi-Sector Impacts of Hydrological Extremes: A Methods  Overview, Earth's Future, 12, e2023EF003906, <a href="https://doi.org/10.1029/2023EF003906" target="_blank">https://doi.org/10.1029/2023EF003906</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>de Brito et al.(2025)</label><mixed-citation>
      
de Brito, M. M., Sodoge, J., Kreibich, H., and Kuhlicke, C.: Comprehensive assessment of flood socioeconomic impacts through text-mining, Water Resour. Res., 61, e2024WR037813, <a href="https://doi.org/10.1029/2024WR037813" target="_blank">https://doi.org/10.1029/2024WR037813</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>de Bruijn et al.(2019)</label><mixed-citation>
      
de Bruijn, J. A., de Moel, H., Jongman, B., de Ruiter, M. C., Wagemaker, J.,  and Aerts, J. C.: A global database of historic and real-time flood events  based on social media, Scientific data, 6, 311, <a href="https://doi.org/10.1038/s41597-019-0326-9" target="_blank">https://doi.org/10.1038/s41597-019-0326-9</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>Delforge et al.(2025)</label><mixed-citation>
      
Delforge, D., Wathelet, V., Below, R., Sofia, C. L., Tonnelier, M., van  Loenhout, J. A., and Speybroeck, N.: EM-DAT: the Emergency Events Database,  Int. J. Disast. Risk Re., 124, 105509, <a href="https://doi.org/10.1016/j.ijdrr.2025.105509" target="_blank">https://doi.org/10.1016/j.ijdrr.2025.105509</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>d'Errico et al.(2022)</label><mixed-citation>
      
D'Errico, M., Pons, F., Yiou, P., Tao, S., Nardini, C., Lunkeit, F., and Faranda, D.: Present and future synoptic circulation patterns associated with cold and snowy spells over Italy, Earth Syst. Dynam., 13, 961–992, <a href="https://doi.org/10.5194/esd-13-961-2022" target="_blank">https://doi.org/10.5194/esd-13-961-2022</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>Devlin et al.(2019)</label><mixed-citation>
      
Devlin, J., Chang, M.-W., Lee, K., and Toutanova, K.: BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding, in:
Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), Association for Computational Linguistics, 4171–4186, <a href="https://doi.org/10.18653/v1/N19-1423" target="_blank">https://doi.org/10.18653/v1/N19-1423</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>Eberenz et al.(2021)</label><mixed-citation>
      
Eberenz, S., Lüthi, S., and Bresch, D. N.: Regional tropical cyclone impact functions for globally consistent risk assessments, Nat. Hazards Earth Syst. Sci., 21, 393–415, <a href="https://doi.org/10.5194/nhess-21-393-2021" target="_blank">https://doi.org/10.5194/nhess-21-393-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>Faiella et al.(2020)</label><mixed-citation>
      
Faiella, A., Antofie, T., Luoni, S., Marin Ferrer, M., and Rios Diaz, F.: The  Risk Data Hub loss datasets, Tech. Rep. EUR 30036 EN, Publications Office of  the European Union, Luxembourg, <a href="https://doi.org/10.2760/488300" target="_blank">https://doi.org/10.2760/488300</a>, ISBN&thinsp;978-92-76-14656-8, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>Flynn et al.(2025)</label><mixed-citation>
      
Flynn, C. M., Moemken, J., Pinto, J. G., Schutte, M. K., and Messori, G.: CLIMK–WINDS: a new database of extreme European winter windstorms, Earth Syst. Sci. Data, 17, 4431–4453, <a href="https://doi.org/10.5194/essd-17-4431-2025" target="_blank">https://doi.org/10.5194/essd-17-4431-2025</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>Global Administrative Areas(2012)</label><mixed-citation>
      
Global Administrative Areas: GADM database of Global Administrative Areas, version 2.0, <a href="https://gadm.org/" target="_blank"/> (last access: 20 May 2026), 2012.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>Hammond et al.(2015)</label><mixed-citation>
      
Hammond, M. J., Chen, A. S., Djordjević, S., Butler, D., and Mark, O.:  Urban flood impact assessment: A state-of-the-art review, Urban Water J., 12, 14–29, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>Harrington and Otto(2020)</label><mixed-citation>
      
Harrington, L. J. and Otto, F. E.: Reconciling theory with the reality of  African heatwaves, Nat. Clim. Change, 10, 796–798, <a href="https://doi.org/10.1038/s41558-020-0851-8" target="_blank">https://doi.org/10.1038/s41558-020-0851-8</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>Hurlbert et al.(2019)</label><mixed-citation>
      
Hurlbert, M., Krishnaswamy, J., Johnson, F. X., Rodríguez-Morales, J. E., and Zommers, Z.: 7 – Risk management and decision making in relation to  sustainable development, in: Climate Change and Land: An IPCC Special Report on Climate Change, Desertification, Land Degradation, Sustainable Land Management, Food Security, and Greenhouse Gas Fluxes in Terrestrial Ecosystems, edited by: Shukla, P. R., Skea, J., Calvo Buendia, E.,  Masson-Delmotte, V., Pörtner, H.-O., Roberts, D. C., Zhai, P., Slade, R.,  Connors, S., van Diemen, R., Ferrat, M., Haughey, E., Luz, S., Neogi, S.,  Pathak, M., Petzold, J., Portugal Pereira, J., Vyas, P., Huntley, E.,  Kissick, K., Belkacemi, M., and Malley, J., Cambridge University Press, Cambridge, 673–800, <a href="https://doi.org/10.1017/9781009157988.009" target="_blank">https://doi.org/10.1017/9781009157988.009</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>Jones et al.(2022)</label><mixed-citation>
      
Jones, M. W., Abatzoglou, J. T., Veraverbeke, S., Andela, N., Lasslop, G.,  Forkel, M., Smith, A. J. P., Burton, C., Betts, R. A., van der Werf, G. R.,  Sitch, S., Canadell, J. G., Santín, C., Kolden, C., Doerr, S. H., and  Le Quéré, C.: Global and Regional Trends and Drivers of Fire Under Climate  Change, Rev. Geophys., 60, e2020RG000726, <a href="https://doi.org/10.1029/2020RG000726" target="_blank">https://doi.org/10.1029/2020RG000726</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>Kreibich et al.(2023)</label><mixed-citation>
      
Kreibich, H., Schröter, K., Di Baldassarre, G., Van Loon, A. F., Mazzoleni, M., Abeshu, G. W., Agafonova, S., AghaKouchak, A., Aksoy, H., Alvarez-Garreton, C., Aznar, B., Balkhi, L., Barendrecht, M. H., Biancamaria, S., Bos-Burgering, L., Bradley, C., Budiyono, Y., Buytaert, W., Capewell, L., Carlson, H., Cavus, Y., Couasnon, A., Coxon, G., Daliakopoulos, I., de Ruiter, M. C., Delus, C., Erfurt, M., Esposito, G., François, D., Frappart, F., Freer, J., Frolova, N., Gain, A. K., Grillakis, M., Grima, J. O., Guzmán, D. A., Huning, L. S., Ionita, M., Kharlamov, M., Khoi, D. N., Kieboom, N., Kireeva, M., Koutroulis, A., Lavado-Casimiro, W., Li, H.-Y., LLasat, M. C., Macdonald, D., Mård, J., Mathew-Richards, H., McKenzie, A., Mejia, A., Mendiondo, E. M., Mens, M., Mobini, S., Mohor, G. S., Nagavciuc, V., Ngo-Duc, T., Nguyen, H. T. T., Nhi, P. T. T., Petrucci, O., Quan, N. H., Quintana-Seguí, P., Razavi, S., Ridolfi, E., Riegel, J., Sadik, M. S., Sairam, N., Savelli, E., Sazonov, A., Sharma, S., Sörensen, J., Souza, F. A. A., Stahl, K., Steinhausen, M., Stoelzle, M., Szalińska, W., Tang, Q., Tian, F., Tokarczyk, T., Tovar, C., Tran, T. V. T., van Huijgevoort, M. H. J., van Vliet, M. T. H., Vorogushyn, S., Wagener, T., Wang, Y., Wendt, D. E., Wickham, E., Yang, L., Zambrano-Bigiarini, M., and Ward, P. J.: Panta Rhei benchmark dataset: socio-hydrological data of paired events of floods and droughts, Earth Syst. Sci. Data, 15, 2009–2023, <a href="https://doi.org/10.5194/essd-15-2009-2023" target="_blank">https://doi.org/10.5194/essd-15-2009-2023</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>Lange et al.(2020)</label><mixed-citation>
      
Lange, S., Volkholz, J., Geiger, T., Zhao, F., Vega, I., Veldkamp, T., Reyer,  C., Warszawski, L., Huber, V., Jägermeyr, J., Schewe, J., Bresch, D.,  Büchner, M., Chang, J., Ciais, P., Dury, M., Emanuel, K., Folberth, C.,  Gerten, D., and Frieler, K.: Projecting Exposure to Extreme Climate Impact  Events Across Six Event Categories and Three Spatial Scales, Earth's Future,  11, e2020EF001616, <a href="https://doi.org/10.1029/2020EF001616" target="_blank">https://doi.org/10.1029/2020EF001616</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>Lee et al.(2024)</label><mixed-citation>
      
Lee, R., White, C. J., Adnan, M. S. G., Douglas, J., Mahecha, M. D.,  O'Loughlin, F. E., Patelli, E., Ramos, A. M., Roberts, M. J., Martius, O.,  Tubaldi, E., van den Hurk, B., Ward, P. J., and Zscheischler, J.:  Reclassifying historical disasters: From single to multi-hazards, Sci. Total Environ., 912, 169120, <a href="https://doi.org/10.1016/j.scitotenv.2023.169120" target="_blank">https://doi.org/10.1016/j.scitotenv.2023.169120</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>Li et al.(2024)</label><mixed-citation>
      
Li, N., Zahra, S., de Brito, M. M., Flynn, C. M., Görnerup, O., Koffi, W., Kurfali, M., Meng, C., Thiery, W., Zscheischler, J., Messori, G., and Nivre, J.: Using LLMs to Build a Database of Climate Extreme Impacts, in: Natural Language Processing meets Climate Change @ ACL 2024,  <a href="https://openreview.net/forum?id=h7o0qyQ0rt" target="_blank"/> (last access:20 May 2026), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>Li et al.(2026a)</label><mixed-citation>
      
Li, N., Thiery, W., Zahra, S., de Brito, M. M., Worou, K., Kurfali, M., Lampe, S., Munoz, P., Flynn, C., Trigoso, C., Nivre, J., Zscheischler, J., and Messori, G.: Wikimpacts – A global climate impact database based on  automated information extraction from Wikipedia, Version 1.0.final, Bolin Centre Database [data set],  <a href="https://doi.org/10.17043/li-2025-wikimpacts-1.0.final" target="_blank">https://doi.org/10.17043/li-2025-wikimpacts-1.0.final</a>, 2026a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>Li et al.(2026b)</label><mixed-citation>
      
Li, N., Zahra, S., Worou, K., Kurfali, M., Görnerup, O., Nivre, J., and  Messori, G.: VUB-HYDR/Wikimpacts: Wikimpacts v1.0.final, Version v1.0.final, Zenodo [code/data set], <a href="https://doi.org/10.5281/zenodo.19428787" target="_blank">https://doi.org/10.5281/zenodo.19428787</a>, 2026b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>Lindersson and Messori(2025)</label><mixed-citation>
      
Lindersson, S. and Messori, G.: SHEDIS-Temperature: linking temperature-related disaster impacts to subnational data on meteorology and human exposure, Earth Syst. Sci. Data, 17, 6379–6403, <a href="https://doi.org/10.5194/essd-17-6379-2025" target="_blank">https://doi.org/10.5194/essd-17-6379-2025</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>Lüthi et al.(2021)</label><mixed-citation>
      
Lüthi, S., Aznar-Siguan, G., Fairless, C., and Bresch, D. N.: Globally consistent assessment of economic impacts of wildfires in CLIMADA v2.2, Geosci. Model Dev., 14, 7175–7187, <a href="https://doi.org/10.5194/gmd-14-7175-2021" target="_blank">https://doi.org/10.5194/gmd-14-7175-2021</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>Mithal et al.(2024)</label><mixed-citation>
      
Mithal, V., Sillmann, J., and Zscheischler, J.: Linking regional economic  impacts of temperature-related disasters to underlying climatic hazards,  Environ. Res. Lett., 19, 124010, <a href="https://doi.org/10.1088/1748-9326/ad89de" target="_blank">https://doi.org/10.1088/1748-9326/ad89de</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>Moemken et al.(2024)</label><mixed-citation>
      
Moemken, J., Messori, G., and Pinto, J. G.: Windstorm losses in Europe–What to gain from damage datasets, Weather and Climate Extremes, 44, 100661, <a href="https://doi.org/10.1016/j.wace.2024.100661" target="_blank">https://doi.org/10.1016/j.wace.2024.100661</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>Mora et al.(2017)</label><mixed-citation>
      
Mora, C., Dousset, B., Caldwell, I. R., Powell, F. E., Geronimo, R. C., Bielecki, C. R., Counsell, C. W. W., Dietrich, B. S., Johnston, E. T., Louis, L. V., Lucas, M. P., McKenzie, M. M., Shea, A. G., Tseng, H., Giambelluca, T. W., Leon, Lisa R., Hawkins, E., and Trauernicht, C.: Global risk of deadly heat, Nat. Clim. Change, 7, 501–506, <a href="https://doi.org/10.1038/nclimate3322" target="_blank">https://doi.org/10.1038/nclimate3322</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>Muheki et al.(2024)</label><mixed-citation>
      
Muheki, D., Deijns, A. A. J., Bevacqua, E., Messori, G., Zscheischler, J., and Thiery, W.: The perfect storm? Co-occurring climate extremes in East Africa, Earth Syst. Dynam., 15, 429–466, <a href="https://doi.org/10.5194/esd-15-429-2024" target="_blank">https://doi.org/10.5194/esd-15-429-2024</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>OpenAI(2024)</label><mixed-citation>
      
OpenAI: Gpt-4o system card,   <a href="https://cdn.openai.com/gpt-4o-system-card.pdf" target="_blank"/> (last access: 20 May 2026), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>OpenStreetMap contributors(2017a)</label><mixed-citation>
      
OpenStreetMap contributors: Planet dump,  <a href="https://www.openstreetmap.org" target="_blank"/> (last access: 20 May 2026), 2017a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>OpenStreetMap contributors(2017b)</label><mixed-citation>
      
OpenStreetMap contributors: TMC/Location Code List/Location Types,  <a href="https://wiki.openstreetmap.org/wiki/TMC/Location_Code_List/Location_Types" target="_blank"/> (last access: 20 May 2026),  2017b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>Panwar and Sen(2019)</label><mixed-citation>
      
Panwar, V. and Sen, S.: Economic impact of natural disasters: An empirical  re-examination, Margin: The Journal of Applied Economic Research, 13,  109–139, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>Panwar and Sen(2020)</label><mixed-citation>
      
Panwar, V. and Sen, S.: Disaster damage records of EM-DAT and DesInventar: a  systematic comparison, Economics of Disasters and Climate Change, 4,  295–317, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>Papagiannaki et al.(2022)</label><mixed-citation>
      
Papagiannaki, K., Petrucci, O., Diakakis, M., Kotroni, V., Aceto, L., Bianchi, C., Brázdil, R., Gelabert, M. G., Inbar, M., Kahraman, A., Özgenur   Kılıç, Krahn, A., Kreibich, H., Llasat, M. C., Llasat-Botija, M.,   Macdonald, N., de Brito, M. M., Mercuri, M., Pereira, S., Řehoř, J., Geli,   J. R., Salvati, P., Vinet, F., and Zêzere, J. L.: Developing a large-scale   dataset of flood fatalities for territories in the Euro-Mediterranean region,   FFEM-DB, Scientific Data, 9, 166, <a href="https://doi.org/10.1038/s41597-022-01273-x" target="_blank">https://doi.org/10.1038/s41597-022-01273-x</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>Paprotny et al.(2024)</label><mixed-citation>
      
Paprotny, D., Terefenko, P., and Śledziowski, J.: HANZE v2.1: an improved database of flood impacts in Europe from 1870 to 2020, Earth Syst. Sci. Data, 16, 5145–5170, <a href="https://doi.org/10.5194/essd-16-5145-2024" target="_blank">https://doi.org/10.5194/essd-16-5145-2024</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>Rosvold and Buhaug(2021)</label><mixed-citation>
      
Rosvold, E. L. and Buhaug, H.: GDIS, a global dataset of geocoded disaster  locations, Scientific data, 8, 61, <a href="https://doi.org/10.1038/s41597-021-00846-6" target="_blank">https://doi.org/10.1038/s41597-021-00846-6</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>Sanh et al.(2019)</label><mixed-citation>
      
Sanh, V., Debut, L., Chaumond, J., and Wolf, T.: DistilBERT, a distilled  version of BERT: smaller, faster, cheaper and lighter, arXiv [preprint], <a href="https://doi.org/10.48550/arXiv.1910.01108" target="_blank">https://doi.org/10.48550/arXiv.1910.01108</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>Seneviratne et al.(2021)</label><mixed-citation>
      
Seneviratne, S., Zhang, X., Adnan, M., Badi, W., Dereczynski, C., Di Luca, A., Ghosh, S., Iskandar, I., Kossin, J., Lewis, S., Otto, F., Pinto, I., Satoh, M., Vicente-Serrano, S., Wehner, M., and Zhou, B.: Weather and Climate  Extreme Events in a Changing Climate, Cambridge University Press, Cambridge, United Kingdom and New York, NY, USA, 1513–1766,   <a href="https://doi.org/10.1017/9781009157896.013" target="_blank">https://doi.org/10.1017/9781009157896.013</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>Sodoge et al.(2023)</label><mixed-citation>
      
Sodoge, J., Kuhlicke, C., and de Brito, M. M.: Automatized spatio-temporal  detection of drought impacts from newspaper articles using natural language  processing and machine learning, Weather and Climate Extremes, 41, 100574,
<a href="https://doi.org/10.1016/j.wace.2023.100574" target="_blank">https://doi.org/10.1016/j.wace.2023.100574</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>Stahl et al.(2016)</label><mixed-citation>
      
Stahl, K., Kohn, I., Blauhut, V., Urquijo, J., De Stefano, L., Acácio, V., Dias, S., Stagge, J. H., Tallaksen, L. M., Kampragou, E., Van Loon, A. F., Barker, L. J., Melsen, L. A., Bifulco, C., Musolino, D., de Carli, A., Massarutto, A., Assimacopoulos, D., and Van Lanen, H. A. J.: Impacts of European drought events: insights from an international database of text-based reports, Nat. Hazards Earth Syst. Sci., 16, 801–819, <a href="https://doi.org/10.5194/nhess-16-801-2016" target="_blank">https://doi.org/10.5194/nhess-16-801-2016</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>Teber et al.(2025)</label><mixed-citation>
      
Teber, K., Weynants, M., Gans, F., and Mahecha, M. D.: Geo-Disasters: Geocoding climate-related events in the international disaster database EM-DAT, Big Earth Data, 10, 303–318, <a href="https://doi.org/10.1080/20964471.2025.2576274" target="_blank">https://doi.org/10.1080/20964471.2025.2576274</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>Thiery et al.(2017)</label><mixed-citation>
      
Thiery, W., Gudmundsson, L., Bedka, K., Semazzi, F. H., Lhermitte, S., Willems, P., van Lipzig, N. P., and Seneviratne, S. I.: Early warnings of hazardous thunderstorms over Lake Victoria, Environ. Res. Lett., 12, 074012, <a href="https://doi.org/10.1088/1748-9326/aa7521" target="_blank">https://doi.org/10.1088/1748-9326/aa7521</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>Thiery et al.(2021)</label><mixed-citation>
      
Thiery, W., Lange, S., Rogelj, J., Schleussner, C.-F., Gudmundsson, L.,  Seneviratne, S. I., Andrijevic, M., Frieler, K., Emanuel, K., Geiger, T.,  Bresch, D. N., Zhao, F., Willner, S. N., Büchner, M., Volkholz, J., Bauer,  N., Chang, J., Ciais, P., Dury, M., François, L., Grillakis, M., Gosling,  S. N., Hanasaki, N., Hickler, T., Huber, V., Ito, A., Jägermeyr, J.,  Khabarov, N., Koutroulis, A., Liu, W., Lutz, W., Mengel, M., Müller, C.,  Ostberg, S., Reyer, C. P. O., Stacke, T., and Wada, Y.: Intergenerational  inequities in exposure to climate extremes, Science, 374, 158–160,  <a href="https://doi.org/10.1126/science.abi7339" target="_blank">https://doi.org/10.1126/science.abi7339</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>Tonmoy et al.(2024)</label><mixed-citation>
      
Tonmoy, S. M. T. I., Zaman, S. M. M., Jain, V., Rani, A., Rawte, V., Chadha,  A., and Das, A.: A Comprehensive Survey of Hallucination Mitigation  Techniques in Large Language Models, arXiv [preprint],  <a href="https://doi.org/10.48550/arXiv.2401.01313" target="_blank">https://doi.org/10.48550/arXiv.2401.01313</a>, 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>Tschumi and Zscheischler(2020)</label><mixed-citation>
      
Tschumi, E. and Zscheischler, J.: Countrywide climate features during recorded climate-related disasters, Climatic Change, 158, 593–609, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>UNISDR(2024)</label><mixed-citation>
      
UNISDR: DesInventar: United Nations Office for Disaster Risk Reduction,  <a href="https://www.desinventar.net/" target="_blank"/> (last access: May 2024), 2024.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib51"><label>Wikipedia contributors(2024a)</label><mixed-citation>
      
Wikipedia contributors: 1939 Pacific hurricane season – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=1939_Pacific_hurricane_season&amp;oldid=1224891091" target="_blank"/>,
(last access: 26 January 2026), 2024a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib52"><label>Wikipedia contributors(2024b)</label><mixed-citation>
      
Wikipedia contributors: Hurricane Nate (2005) – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Hurricane_Nate_(2005)&amp;oldid=1249615441" target="_blank"/>,
(last access: 30 January 2026), 2024b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib53"><label>Wikipedia contributors(2025a)</label><mixed-citation>
      
Wikipedia contributors: 2015 Russian wildfires – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=2015_Russian_wildfires&amp;oldid=1293003396" target="_blank"/>,
(last access: 26 January 2026), 2025a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib54"><label>Wikipedia contributors(2025b)</label><mixed-citation>
      
Wikipedia contributors: 2017 Tulsa tornadoes – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=2017_Tulsa_tornadoes&amp;oldid=1296198946" target="_blank"/>,
(last access: 26 January 2026), 2025b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib55"><label>Wikipedia contributors(2025c)</label><mixed-citation>
      
Wikipedia contributors: 1999 Blayais Nuclear Power Plant flood – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=1999_Blayais_Nuclear_Power_Plant_flood&amp;oldid=1309899681" target="_blank"/>,
(last access: 26 January 2026), 2025c.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib56"><label>Wikipedia contributors(2025d)</label><mixed-citation>
      
Wikipedia contributors: 2011 European floods – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=2011_European_floods&amp;oldid=1310685507" target="_blank"/>,
(last access: 26 January 2026), 2025d.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib57"><label>Wikipedia contributors(2025e)</label><mixed-citation>
      
Wikipedia contributors: Hurricane Larry – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Hurricane_Larry&amp;oldid=1315207889" target="_blank"/>,
(last access: 30 January 2026), 2025e.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib58"><label>Wikipedia contributors(2025f)</label><mixed-citation>
      
Wikipedia contributors: List of Nicaragua hurricanes – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=List_of_Nicaragua_hurricanes&amp;oldid=1319005054" target="_blank"/>,
(last access: 9 April 2026), 2025f.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib59"><label>Wikipedia contributors(2025g)</label><mixed-citation>
      
Wikipedia contributors: Cyclone Vayu – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Cyclone_Vayu&amp;oldid=1320664862" target="_blank"/>,
(last access: 30 January 2026), 2025g.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib60"><label>Wikipedia contributors(2025h)</label><mixed-citation>
      
Wikipedia contributors: Typhoon Kate – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Typhoon_Kate&amp;oldid=1321753937" target="_blank"/>,
(last access: 26 January 2026), 2025h.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib61"><label>Wikipedia contributors(2025i)</label><mixed-citation>
      
Wikipedia contributors: Typhoons in Taiwan – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Typhoons_in_Taiwan&amp;oldid=1322603935" target="_blank"/>,
(last access: 9 April 2026), 2025i.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib62"><label>Wikipedia contributors(2025j)</label><mixed-citation>
      
Wikipedia contributors: Tropical cyclones in 2013 – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Tropical_cyclones_in_2013&amp;oldid=1325283599" target="_blank"/>,
(last access: 26 January 2026), 2025j.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib63"><label>Wikipedia contributors(2026a)</label><mixed-citation>
      
Wikipedia contributors: 1983–1985 famine in Ethiopia – Wikipedia, The Free Encyclopedia,
<a href="https://en.wikipedia.org/w/index.php?title=1983-1985_famine_in_Ethiopia&amp;oldid=1332375726" target="_blank"/>,
(last access: 30 January 2026), 2026a.


    </mixed-citation></ref-html>
<ref-html id="bib1.bib64"><label>Wikipedia contributors(2026b)</label><mixed-citation>
      
Wikipedia contributors: 2021 European floods – Wikipedia, The Free   Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=2021_European_floods&amp;oldid=1333089008" target="_blank"/>,
(last access: 26 January 2026), 2026b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib65"><label>Wikipedia contributors(2026c)</label><mixed-citation>
      
Wikipedia contributors: Hurricane Ida – Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Hurricane_Ida&amp;oldid=1333487396" target="_blank"/>,
(last access: 30 January 2026), 2026c.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib66"><label>Wikipedia contributors(2026d)</label><mixed-citation>
      
Wikipedia contributors: Miami Hurricanes football – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Miami_Hurricanes_football&amp;oldid=1334196783" target="_blank"/>,
(last access: 30 January 2026), 2026d.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib67"><label>Wikipedia contributors(2026e)</label><mixed-citation>
      
Wikipedia contributors: 2021 Atlantic hurricane season – Wikipedia, The  Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=2021_Atlantic_hurricane_season&amp;oldid=1335534205" target="_blank"/>,
(last access: 30 January 2026), 2026e.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib68"><label>Wikipedia contributors(2026f)</label><mixed-citation>
      
Wikipedia contributors: Typhoon Talim (2017) – Wikipedia, The Free  Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Typhoon_Talim_(2017)&amp;oldid=1336967505" target="_blank"/>,
(last access: 9 April 2026), 2026f.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib69"><label>Wikipedia contributors(2026g)</label><mixed-citation>
      
Wikipedia contributors: Lists of tornadoes and tornado outbreaks –   Wikipedia, The Free Encyclopedia,  <a href="https://en.wikipedia.org/w/index.php?title=Lists_of_tornadoes_and_tornado_outbreaks&amp;oldid=1343462266" target="_blank"/>,
(last access: 9 April 2026), 2026g.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib70"><label>Worou and Messori(2025)</label><mixed-citation>
      
Worou, K. and Messori, G.: Compounding droughts and floods amplify  socio-economic impacts, Environ. Res. Lett., 20, 104024, <a href="https://doi.org/10.1088/1748-9326/adfe82" target="_blank">https://doi.org/10.1088/1748-9326/adfe82</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib71"><label>Zommers et al.(2020)</label><mixed-citation>
      
Zommers, Z., Marbaix, P., Fischlin, A., Ibrahim, Z. Z., Grant, S., Magnan,  A. K., Pörtner, H.-O., Howden, M., Calvin, K., Warner, K., Thiery, W.,  Sebesvari, Z., Davin, E. L., Evans, J. P., Rosenzweig, C., O’Neill, B. C.,  Patwardhan, A., Warren, R., van Aalst, M. K., and Hulbert, M.: Burning  embers: towards more transparent and robust climate-change risk assessments,  Nature Reviews Earth &amp; Environment, 1, 516–529,  <a href="https://doi.org/10.1038/s43017-020-0088-0" target="_blank">https://doi.org/10.1038/s43017-020-0088-0</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib72"><label>Zscheischler and Seneviratne(2017)</label><mixed-citation>
      
Zscheischler, J. and Seneviratne, S. I.: Dependence of drivers affects risks  associated with compound events, Science Advances, 3, e1700263, <a href="https://doi.org/10.1126/sciadv.1700263" target="_blank">https://doi.org/10.1126/sciadv.1700263</a>, 2017.

    </mixed-citation></ref-html>--></article>
