{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2026-06-09T17:34:54.604663+00:00",
  "custom_fields": {
    "code:codeRepository": "https://github.com/hipe-eval/HIPE-2026-data"
  },
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "hipe-eval/HIPE-2026-data-v1.0.zip": {
        "access": {
          "hidden": false
        },
        "checksum": "md5:16c53c21f5eec0f66790aa251823a171",
        "ext": "zip",
        "id": "2a6087f1-b9d8-45f0-b9e5-6008f7d46a4e",
        "key": "hipe-eval/HIPE-2026-data-v1.0.zip",
        "links": {
          "container": "https://zenodo.org/api/records/20615690/files/hipe-eval/HIPE-2026-data-v1.0.zip/container",
          "content": "https://zenodo.org/api/records/20615690/files/hipe-eval/HIPE-2026-data-v1.0.zip/content",
          "self": "https://zenodo.org/api/records/20615690/files/hipe-eval/HIPE-2026-data-v1.0.zip"
        },
        "metadata": null,
        "mimetype": "application/zip",
        "size": 1947498,
        "storage_class": "L"
      }
    },
    "order": [],
    "total_bytes": 1947498
  },
  "id": "20615690",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/20615690/access",
    "access_grants": "https://zenodo.org/api/records/20615690/access/grants",
    "access_links": "https://zenodo.org/api/records/20615690/access/links",
    "access_request": "https://zenodo.org/api/records/20615690/access/request",
    "access_users": "https://zenodo.org/api/records/20615690/access/users",
    "archive": "https://zenodo.org/api/records/20615690/files-archive",
    "archive_media": "https://zenodo.org/api/records/20615690/media-files-archive",
    "communities": "https://zenodo.org/api/records/20615690/communities",
    "communities-suggestions": "https://zenodo.org/api/records/20615690/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.20615690",
    "draft": "https://zenodo.org/api/records/20615690/draft",
    "file_modification": "https://zenodo.org/api/records/20615690/file-modification",
    "files": "https://zenodo.org/api/records/20615690/files",
    "latest": "https://zenodo.org/api/records/20615690/versions/latest",
    "latest_html": "https://zenodo.org/records/20615690/latest",
    "media_files": "https://zenodo.org/api/records/20615690/media-files",
    "parent": "https://zenodo.org/api/records/20615689",
    "parent_doi": "https://doi.org/10.5281/zenodo.20615689",
    "parent_doi_html": "https://zenodo.org/doi/10.5281/zenodo.20615689",
    "parent_html": "https://zenodo.org/records/20615689",
    "preview_html": "https://zenodo.org/records/20615690?preview=1",
    "quota_increase": "https://zenodo.org/api/records/20615690/quota-increase",
    "request_deletion": "https://zenodo.org/api/records/20615690/request-deletion",
    "requests": "https://zenodo.org/api/records/20615690/requests",
    "reserve_doi": "https://zenodo.org/api/records/20615690/draft/pids/doi",
    "self": "https://zenodo.org/api/records/20615690",
    "self_doi": "https://doi.org/10.5281/zenodo.20615690",
    "self_doi_html": "https://zenodo.org/doi/10.5281/zenodo.20615690",
    "self_html": "https://zenodo.org/records/20615690",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:20615690/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:20615690/sequence/default",
    "versions": "https://zenodo.org/api/records/20615690/versions"
  },
  "media_files": {
    "count": 0,
    "enabled": false,
    "entries": {},
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "creators": [
      {
        "person_or_org": {
          "family_name": "Juri Opitz",
          "name": "Juri Opitz",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "EPFL-DHLAB"
          }
        ],
        "person_or_org": {
          "family_name": "Maud Ehrmann",
          "name": "Maud Ehrmann",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "University of Zurich"
          }
        ],
        "person_or_org": {
          "family_name": "Andrianos Michail",
          "name": "Andrianos Michail",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "University of Zurich"
          }
        ],
        "person_or_org": {
          "family_name": "Simon Clematide",
          "name": "Simon Clematide",
          "type": "personal"
        }
      }
    ],
    "description": "<h2>HIPE-2026 Data \u2014 v1.0</h2>\n<p><strong><a href=\"https://hipe-eval.github.io/HIPE-2026/\">HIPE-2026</a></strong> is a CLEF 2026 Evaluation Lab on the qualification of <strong>person\u2013place relations in multilingual historical documents</strong> (<em>Who was where, when?</em>). This release contains the complete <strong>v1.0</strong> dataset used during the official evaluation campaign.</p>\n<p><a href=\"https://doi.org/10.5281/zenodo.XXXXXXX\"></a></p>\n<h3>\ud83d\udce6 What's in this release</h3>\n<p>The HIPE-2026 dataset covers <strong>two evaluation domains</strong> across two test sets:</p>\n<ul>\n<li><strong>Domain A \u2014 Historical Newspapers (Test A):</strong> Articles in German, English, and French from the HIPE historical newspaper corpus (derived from HIPE-2022 impresso dataset). Entity annotations and Wikidata links were manually created in HIPE-2022. Person-Places relations were manually annotated for HIPE-2026. Evaluates both <code>at</code> and <code>isAt</code> relations.</li>\n<li><strong>Domain B \u2014 Literary Works (Test B, surprise):</strong> A held-out test set of French literature and history works from the 16th\u201318th centuries, included to assess out-of-domain generalization. Evaluates <code>at</code> only.</li>\n</ul>\n<p>| Split | Domain | Languages | File(s) |\n|---|---|---|---|\n| Train | Newspapers | DE, EN, FR | <code>data/newspapers/v1.0/HIPE-2026-v1.0-impresso-train-*.jsonl</code> |\n| Test | Newspapers | DE, EN, FR | <code>data/newspapers/v1.0/HIPE-2026-v1.0-impresso-test-*.jsonl</code> |\n| Test (masked) | Newspapers | DE, EN, FR | <code>data/newspapers/v1.0/HIPE-2026-v1.0-impresso-test_masked-*.jsonl</code> |\n| Test | Literary works | FR | <code>data/litworks/v1.0/HIPE-2026-v1.0-surprise-test-fr.jsonl</code> |\n| Test (masked) | Literary works | FR | <code>data/litworks/v1.0/HIPE-2026-v1.0-surprise-test_masked-fr.jsonl</code> |</p>\n<p>For detailed information on tasks, datasets, and evaluation protocol, refer to the <a href=\"https://zenodo.org/records/20082076\">CLEF HIPE-2026 Shared Task Participation Guidelines</a>.</p>\n<h3>\ud83d\udd2c Reproducing the official evaluation</h3>\n<p>The full campaign evaluation \u2014 including reference data, participant submissions, and the evaluation orchestrator \u2014 is available at:\n\ud83d\udc49 <a href=\"https://github.com/hipe-eval/hipe-2026-eval\">https://github.com/hipe-eval/hipe-2026-eval</a></p>\n<h3>\ud83d\udcd0 Data format</h3>\n<p>Data is distributed as UTF-8 JSON Lines (<code>.jsonl</code>). Each line is one document with OCR text, document metadata, and sampled person\u2013location pairs. Prediction targets are:</p>\n<ul>\n<li><code>at</code> \u2014 evidence that a person was at a location at any time before publication (<code>TRUE</code>, <code>FALSE</code>, <code>PROBABLE</code>, <code>null</code>)</li>\n<li><code>isAt</code> \u2014 evidence of presence within ~one month before publication (<code>TRUE</code>, <code>FALSE</code>, <code>null</code>)</li>\n</ul>\n<p>The full schema is in <a href=\"schemas/hipe-2026-data.schema.json\"><code>schemas/hipe-2026-data.schema.json</code></a>. See the <a href=\"README.md\">README</a> for format details, validation, and a prediction/evaluation walkthrough.</p>\n<h3>\ud83d\udcd6 How to cite</h3>\n<blockquote>\n<p>Juri Opitz, Corina Racl\u00e9, Andrianos Michail, Matteo Romanello, Emanuela Boros, Simon Gabay, Maud Ehrmann, and Simon Clematide. 2026. <strong>Extended Overview of HIPE-2026: Evaluating Accurate and Efficient Person\u2013Place Relation Extraction from Multilingual Historical Texts</strong>. In <em>CLEF 2026 Working Notes, CEUR Workshop Proceedings</em>. https://doi.org/10.5281/zenodo.20344461</p>\n</blockquote>\n<h3>\ud83d\udcdc License</h3>\n<p>Released under <a href=\"https://creativecommons.org/licenses/by-nc-sa/4.0/\">CC BY-NC-SA 4.0</a>.</p>\n<p><em>HIPE-2026 is organised within the <a href=\"https://impresso-project.ch/\">Impresso</a> project, funded by the Swiss National Science Foundation (grant CRSII5_213585) and the Luxembourg National Research Fund (grant 17498891).</em></p>",
    "publication_date": "2026-06-09",
    "publisher": "Zenodo",
    "related_identifiers": [
      {
        "identifier": "https://github.com/hipe-eval/HIPE-2026-data/tree/v1.0",
        "relation_type": {
          "id": "issupplementto",
          "title": {
            "de": "Erg\u00e4nzt",
            "en": "Is supplement to"
          }
        },
        "resource_type": {
          "id": "software",
          "title": {
            "de": "Software",
            "en": "Software"
          }
        },
        "scheme": "url"
      }
    ],
    "resource_type": {
      "id": "dataset",
      "title": {
        "de": "Datensatz",
        "en": "Dataset"
      }
    },
    "rights": [
      {
        "description": {
          "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited."
        },
        "icon": "cc-by-icon",
        "id": "cc-by-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution 4.0 International"
        }
      }
    ],
    "title": "HIPE-2026 Shared Task Person-Place Relation Dataset",
    "version": "v1.0"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "44474"
      },
      "settings": {
        "accept_conditions_text": null,
        "allow_guest_requests": false,
        "allow_user_requests": false,
        "secret_link_expiration": 0
      }
    },
    "communities": {
      "default": "e054c200-d2d3-43c8-af38-c9813962ee5c",
      "entries": [
        {
          "access": {
            "member_policy": "open",
            "members_visibility": "public",
            "record_submission_policy": "open",
            "review_policy": "open",
            "visibility": "public"
          },
          "children": {
            "allow": false
          },
          "created": "2022-02-11T13:17:33.651553+00:00",
          "custom_fields": {},
          "deletion_status": {
            "is_deleted": false,
            "status": "P"
          },
          "id": "e054c200-d2d3-43c8-af38-c9813962ee5c",
          "links": {},
          "metadata": {
            "curation_policy": "<p>The HIPE-EVAL Zenodo community is for datasets, guidelines and papers related to the HIPE shared tasks.</p>\r\n",
            "description": "HIPE is a series of evaluation campaigns on named entity processing on historical documents in multiple languages.",
            "page": "<p>HIPE is a series of evaluation campaigns on named entity processing on historical documents in multiple languages.</p>\r\n",
            "title": "HIPE evaluation campaigns"
          },
          "revision_id": 0,
          "slug": "hipe-eval",
          "updated": "2022-02-11T13:18:06.841769+00:00"
        }
      ],
      "ids": [
        "e054c200-d2d3-43c8-af38-c9813962ee5c"
      ]
    },
    "id": "20615689",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.20615689",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.20615690",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:20615690",
      "provider": "oai"
    }
  },
  "revision_id": 6,
  "stats": {
    "all_versions": {
      "data_volume": 5842494.0,
      "downloads": 3,
      "unique_downloads": 3,
      "unique_views": 17,
      "views": 18
    },
    "this_version": {
      "data_volume": 5842494.0,
      "downloads": 3,
      "unique_downloads": 3,
      "unique_views": 17,
      "views": 18
    }
  },
  "status": "published",
  "swh": {},
  "updated": "2026-06-09T17:38:25.681348+00:00",
  "versions": {
    "index": 1,
    "is_latest": true
  }
}