{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2020-03-31T08:09:34.653463+00:00",
  "custom_fields": {},
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "semeval2020_ulscd_lat.zip": {
        "checksum": "md5:e7c60d2877d8f7b00ac60f2dab4a66f0",
        "ext": "zip",
        "id": "ca4b551b-743b-4b03-a013-ca2e5e2c016d",
        "key": "semeval2020_ulscd_lat.zip",
        "metadata": null,
        "mimetype": "application/zip",
        "size": 28445562
      }
    },
    "order": [],
    "total_bytes": 28445562
  },
  "id": "3734089",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/3734089/access",
    "access_grants": "https://zenodo.org/api/records/3734089/access/grants",
    "access_links": "https://zenodo.org/api/records/3734089/access/links",
    "access_request": "https://zenodo.org/api/records/3734089/access/request",
    "access_users": "https://zenodo.org/api/records/3734089/access/users",
    "archive": "https://zenodo.org/api/records/3734089/files-archive",
    "archive_media": "https://zenodo.org/api/records/3734089/media-files-archive",
    "communities": "https://zenodo.org/api/records/3734089/communities",
    "communities-suggestions": "https://zenodo.org/api/records/3734089/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.3734089",
    "draft": "https://zenodo.org/api/records/3734089/draft",
    "files": "https://zenodo.org/api/records/3734089/files",
    "latest": "https://zenodo.org/api/records/3734089/versions/latest",
    "latest_html": "https://zenodo.org/records/3734089/latest",
    "media_files": "https://zenodo.org/api/records/3734089/media-files",
    "parent": "https://zenodo.org/api/records/3674098",
    "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.3674098",
    "parent_html": "https://zenodo.org/records/3674098",
    "requests": "https://zenodo.org/api/records/3734089/requests",
    "reserve_doi": "https://zenodo.org/api/records/3734089/draft/pids/doi",
    "self": "https://zenodo.org/api/records/3734089",
    "self_doi": "https://zenodo.org/doi/10.5281/zenodo.3734089",
    "self_html": "https://zenodo.org/records/3734089",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:3734089/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:3734089/sequence/default",
    "versions": "https://zenodo.org/api/records/3734089/versions"
  },
  "media_files": {
    "count": 0,
    "enabled": false,
    "entries": {},
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "creators": [
      {
        "affiliations": [
          {
            "name": "University of Cambridge"
          }
        ],
        "person_or_org": {
          "family_name": "McGillivray",
          "given_name": "Barbara",
          "name": "McGillivray, Barbara",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "IMS, University of Stuttgart"
          }
        ],
        "person_or_org": {
          "family_name": "Schlechtweg",
          "given_name": "Dominik",
          "name": "Schlechtweg, Dominik",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "University of Cambridge"
          }
        ],
        "person_or_org": {
          "family_name": "Dubossarsky",
          "given_name": "Haim",
          "name": "Dubossarsky, Haim",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "University of Gothenburg"
          }
        ],
        "person_or_org": {
          "family_name": "Tahmasebi",
          "given_name": "Nina",
          "name": "Tahmasebi, Nina",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "University of Helsinki"
          }
        ],
        "person_or_org": {
          "family_name": "Hengchen",
          "given_name": "Simon",
          "name": "Hengchen, Simon",
          "type": "personal"
        }
      }
    ],
    "description": "<p>This data collection contains the Latin test data for <a href=\"https://competitions.codalab.org/competitions/20948\">SemEval 2020 Task 1: Unsupervised Lexical Semantic Change Detection</a>:&nbsp;</p>\n\n<ul>\n\t<li>a Latin text corpus pair (`corpus1/lemma`, `corpus2/lemma`)</li>\n\t<li>40 lemmas which have been annotated for their lexical semantic change between the two corpora (`targets.txt`)</li>\n\t<li>the annotated binary change scores of the targets for subtask 1, and their annotated graded change scores for subtask 2 (`truth/`)</li>\n</ul>\n\n<p>The corpus data have been automatically lemmatized and part-of-speech tagged, and have been partially corrected by hand. For homonyms, the lemmas are followed by the &#39;\\#&#39; symbol and the number of the homonym according to the Lewis-Short dictionary of Latin when this number is greater than 1. For example, the lemma &#39;dico&#39; corresponds to the first homonym in the Lewis-Short dictionary and &#39;dico\\#2&#39; corresponds to the second homonym, cf. Lewis-Short dictionary.</p>\n\n<p>__Corpus 1__</p>\n\n<ul>\n\t<li>based on: <a href=\"http://hdl.handle.net/11372/LRT-3170\">LatinISE</a>&nbsp;(McGillivray and Kilgarriff 2013), <a href=\"https://app.sketchengine.eu/#dashboard?corpname=preloaded/latinise_4\">version on Sketch Engine</a></li>\n\t<li>language: Latin</li>\n\t<li>time covered: from the beginning of the second century before Christ (BC) to the end of the first century BC</li>\n\t<li>size: ~1.7 million tokens</li>\n\t<li>format: lemmatized, sentence length &gt;= 2, no punctuation, sentences randomly shuffled</li>\n\t<li>encoding: UTF-8</li>\n</ul>\n\n<p>__Corpus 2__</p>\n\n<ul>\n\t<li>based on: <a href=\"http://hdl.handle.net/11372/LRT-3170\">LatinISE</a>&nbsp;(McGillivray and Kilgarriff 2013) , <a href=\"https://app.sketchengine.eu/#dashboard?corpname=preloaded/latinise_4\">version on Sketch Engine</a></li>\n\t<li>language: Latin</li>\n\t<li>time covered: from the beginning of the first century after Christ (AD) to the end of the twenty-first century AD</li>\n\t<li>size: ~9.4 million tokens</li>\n\t<li>format: lemmatized, sentence length &gt;= 2, no punctuation, sentences randomly shuffled</li>\n\t<li>encoding: UTF-8</li>\n</ul>\n\n<p>Find more information on the data in the papers referenced below.</p>\n\n<p><strong>References</strong></p>\n\n<p>Dominik Schlechtweg, Barbara McGillivray, Simon Hengchen, Haim Dubossarsky and Nina Tahmasebi <a href=\"https://competitions.codalab.org/competitions/20948\">SemEval 2020 Task 1: Unsupervised Lexical Semantic Change Detection</a>. To appear in SemEval@COLING2020.</p>\n\n<p>McGillivray, B. and Kilgarriff, A. (2013). <a href=\"https://www.sketchengine.co.uk/wp-content/uploads/2015/05/Latin_historical_corpus_2013.pdf\">Tools for historical corpus research, and a corpus of Latin</a>. In Paul Bennett, Martin Durrell, Silke Scheible, Richard J. Whitt (eds.), New Methods in Historical Corpus Linguistics, T&uuml;bingen: Narr.<br>\n&nbsp;</p>",
    "funding": [
      {
        "award": {
          "id": "001aqnf71::EP/N510129/1",
          "number": "EP/N510129/1",
          "program": "EPSRC",
          "title": {
            "en": "The Alan Turing Institute"
          }
        },
        "funder": {
          "id": "001aqnf71",
          "name": "UK Research and Innovation"
        }
      }
    ],
    "languages": [
      {
        "id": "lat",
        "title": {
          "en": "Latin"
        }
      }
    ],
    "publication_date": "2020-03-31",
    "publisher": "Zenodo",
    "resource_type": {
      "id": "dataset",
      "title": {
        "de": "Datensatz",
        "en": "Dataset"
      }
    },
    "rights": [
      {
        "description": {
          "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited."
        },
        "icon": "cc-by-icon",
        "id": "cc-by-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution 4.0 International"
        }
      }
    ],
    "subjects": [
      {
        "subject": "Latin, corpus"
      }
    ],
    "title": "LatinISE test data for SemEval 2020 task 1",
    "version": "2"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "37947"
      }
    },
    "communities": {},
    "id": "3674098",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.3674098",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.3734089",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:3734089",
      "provider": "oai"
    }
  },
  "revision_id": 3,
  "stats": {
    "all_versions": {
      "data_volume": 26497155772.0,
      "downloads": 809,
      "unique_downloads": 709,
      "unique_views": 1943,
      "views": 2144
    },
    "this_version": {
      "data_volume": 3925487556.0,
      "downloads": 138,
      "unique_downloads": 116,
      "unique_views": 496,
      "views": 536
    }
  },
  "status": "published",
  "updated": "2020-08-20T14:02:18.502562+00:00",
  "versions": {
    "index": 3,
    "is_latest": false
  }
}