Zenodo.org will be unavailable for 2 hours on September 29th from 06:00-08:00 UTC. See announcement.

Other Open Access

Annotation Guidelines for Named Entity Recognition, Entity Linking and Stance Detection

Ahmed Hamdi; Elvys Linhares Pontes; Antoine Doucet


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.4574199">
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.4574199</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.4574199"/>
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0002-8964-2135">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-8964-2135</dct:identifier>
        <foaf:name>Ahmed Hamdi</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of La Rochelle</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Elvys Linhares Pontes</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of La Rochelle</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Antoine Doucet</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of La Rochelle</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:title>Annotation Guidelines for Named Entity Recognition, Entity Linking and Stance Detection</dct:title>
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2021</dct:issued>
    <dcat:keyword>annotation guidelines, named entity recognition, entity linking, stance detection</dcat:keyword>
    <frapo:isFundedBy rdf:resource="info:eu-repo/grantAgreement/EC/H2020/770299/"/>
    <schema:funder>
      <foaf:Organization>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">10.13039/100010661</dct:identifier>
        <foaf:name>European Commission</foaf:name>
      </foaf:Organization>
    </schema:funder>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2021-03-02</dct:issued>
    <owl:sameAs rdf:resource="https://zenodo.org/record/4574199"/>
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/4574199</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.4574198"/>
    <dct:isPartOf rdf:resource="https://zenodo.org/communities/newseye"/>
    <owl:versionInfo>v3.1</owl:versionInfo>
    <dct:description>&lt;p&gt;&lt;em&gt;We describe the NewsEye annotation guidelines for named entity recognition, entity linking and stance detection.&lt;/em&gt;&lt;br&gt; &lt;em&gt;While the part of the guidelines on stance detection annotation is new, these guidelines are derived from Impresso&lt;/em&gt; NE annotation guidelines which are derived from Quaero guidelines. Originally designed for the annotation of &amp;ldquo;extended&amp;rdquo; named entities (i.e. more than the 3 or 4 traditional classes) in French speech transcriptions, Quaero guidelines have furthermore been used on historic press corpora. &lt;em&gt;Impresso&lt;/em&gt; guidelines&amp;rsquo; main difference with respect to Quaero&amp;rsquo;s is &lt;em&gt;reduction&lt;/em&gt;: only a subset of Quaero entity types and components are considered, as well as a subset of linguistic units eligible as named entities. These adaptations result from what we deemed most relevant to annotate in our context, and from time and resource constraints. Despite these adaptations, &lt;em&gt;impresso&lt;/em&gt; annotated corpora will mostly remain compatible with Quaero guidelines.&lt;/p&gt; &lt;p&gt;&amp;nbsp;&lt;/p&gt; &lt;p&gt;These guidelines allowed building a multilingual &lt;a href="https://zenodo.org/record/4573313#.YKzkdKE6-Uk"&gt;dataset&lt;/a&gt; for named entity recognition, entity linking and stance detection in historical newspapers in French, German, Finnish and Swedish. The paper describing the guidelines and the dataset is available here. 
If you end up using the guidelines or the resource, please cite this &lt;a href="https://zenodo.org/record/4694466#.YKzk2qE6-Uk"&gt;paper&lt;/a&gt;:&lt;/p&gt; &lt;pre&gt;&lt;code&gt;@inproceedings{Hamdi2021multilingual, title={A Multilingual Dataset for Named Entity Recognition, Entity Linking and Stance Detection in Historical Newspapers}, author={Hamdi, Ahmed and Boro{\c{s}}, Emanuela and Pontes, Elvys Linhares and Nguyen, Thi Tuyet Hai and Hackl, G{\"u}nter and Moreno, Jose G and Doucet, Antoine}, booktitle={Proceedings of the 44th International ACM SIGIR Conference on Research and Development in Information Retrieval}, year={2021} }&lt;/code&gt;&lt;/pre&gt; &lt;p&gt;&lt;strong&gt;Acknowledgments&lt;/strong&gt;&lt;br&gt; This work has been supported by the European Union&amp;#39;s Horizon 2020 research and innovation programme under grant 770299 [NewsEye](https://www.newseye.eu/).&lt;/p&gt;</dct:description>
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <dct:license rdf:resource="https://creativecommons.org/licenses/by/4.0/legalcode"/>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4574199"/>
        <dcat:byteSize>310532</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/4574199/files/v3.1-Guidelines-NewsEye-NER-EL-StD.pdf"/>
        <dcat:mediaType>application/pdf</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
  <foaf:Project rdf:about="info:eu-repo/grantAgreement/EC/H2020/770299/">
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">770299</dct:identifier>
    <dct:title>NewsEye: A Digital Investigator for Historical Newspapers</dct:title>
    <frapo:isAwardedBy>
      <foaf:Organization>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">10.13039/100010661</dct:identifier>
        <foaf:name>European Commission</foaf:name>
      </foaf:Organization>
    </frapo:isAwardedBy>
  </foaf:Project>
</rdf:RDF>
566
465
views
downloads
All versions This version
Views 566 566
Downloads 465 465
Data volume 144.4 MB 144.4 MB
Unique views 508 508
Unique downloads 425 425

Share

Cite as