Presentation Open Access

Non-source items are a serious problem everywhere

Mayr, Philipp


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
         xmlns:adms="http://www.w3.org/ns/adms#"
         xmlns:dc="http://purl.org/dc/elements/1.1/"
         xmlns:dct="http://purl.org/dc/terms/"
         xmlns:dctype="http://purl.org/dc/dcmitype/"
         xmlns:dcat="http://www.w3.org/ns/dcat#"
         xmlns:duv="http://www.w3.org/ns/duv#"
         xmlns:foaf="http://xmlns.com/foaf/0.1/"
         xmlns:frapo="http://purl.org/cerif/frapo/"
         xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#"
         xmlns:gsp="http://www.opengis.net/ont/geosparql#"
         xmlns:locn="http://www.w3.org/ns/locn#"
         xmlns:org="http://www.w3.org/ns/org#"
         xmlns:owl="http://www.w3.org/2002/07/owl#"
         xmlns:prov="http://www.w3.org/ns/prov#"
         xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
         xmlns:schema="http://schema.org/"
         xmlns:skos="http://www.w3.org/2004/02/skos/core#"
         xmlns:vcard="http://www.w3.org/2006/vcard/ns#"
         xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <!-- DCAT description of the record identified by DOI 10.5281/zenodo.4021225.
       All namespace prefixes are declared once on the root element. -->
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.4021225">
    <rdf:type rdf:resource="http://www.w3.org/ns/dcat#Dataset"/>
    <dct:type rdf:resource="http://purl.org/dc/dcmitype/Text"/>
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.4021225</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.4021225"/>
    <!-- Creator: an agent identified by its ORCID IRI, with an affiliation. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0002-6656-1658">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-6656-1658</dct:identifier>
        <foaf:name>Mayr, Philipp</foaf:name>
        <foaf:givenName>Philipp</foaf:givenName>
        <foaf:familyName>Mayr</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>GESIS - Leibniz-Institute for the Social Sciences</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:title>Non-source items are a serious problem everywhere</dct:title>
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- The issue date is given twice: as a year and as a full date. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2020</dct:issued>
    <!-- One dcat:keyword element per keyword, so consumers never have to
         split a comma-separated literal. -->
    <dcat:keyword>reference extraction</dcat:keyword>
    <dcat:keyword>non-source items</dcat:keyword>
    <dcat:keyword>bibliographic databases</dcat:keyword>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2020-09-09</dct:issued>
    <dct:language rdf:resource="http://publications.europa.eu/resource/authority/language/ENG"/>
    <owl:sameAs rdf:resource="https://zenodo.org/record/4021225"/>
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/4021225</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.4021224"/>
    <dct:isPartOf rdf:resource="https://zenodo.org/communities/osr"/>
    <!-- The first description literal holds escaped HTML markup; it is kept
         on one line because whitespace inside a literal is data. -->
    <dct:description>&lt;p&gt;Making bibliographic data available for researchers, scholars and others is important in all disciplines to ensure easy and fast access to the literature and other scientific resources such as research datasets. Our previous project EXCITE has addressed this problem and narrowed the gap between the availability of citation data in the social sciences. EXCITE has researched, developed, and deployed powerful tools (https://github.com/exciteproject/) that localize, extract and segment reference strings in PDF documents and then match them against bibliographic databases. One of the main conclusions derived from EXCITE is that the metadata of approx. 60% of the cited papers and other scientific resources are outside of available bibliographic databases. The extracted reference strings (items) that could not be matched are called &amp;ldquo;non-source items&amp;rdquo; (NSI). NSI include incomplete or erroneous references as well as references that indeed do not exist in the available bibliographic databases, especially references to datasets, websites and other material. This talk will highlight the significance of NSI for citation matching and suggest possible algorithms to reduce the amount of NSI in digital libraries.&lt;/p&gt; &lt;p&gt;Presentation given at the&amp;nbsp;Workshop On Open Citations And Open Scholarly Metadata 2020 (Virtual Event)&lt;/p&gt;</dct:description>
    <dct:description>Presentation given at the Workshop On Open Citations And Open Scholarly Metadata 2020 (Virtual Event)</dct:description>
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <!-- Distribution carrying the licence and the landing-page access URL. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dct:license rdf:resource="https://creativecommons.org/licenses/by/4.0/legalcode"/>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4021225"/>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- Distribution for the downloadable .pptx file. -->
    <dcat:distribution>
      <dcat:Distribution>
        <!-- URLs are IRI references (rdf:resource), not plain literals. -->
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4021225"/>
        <!-- Typed as DCAT 3 specifies; DCAT 2 used xsd:decimal, for which
             this lexical value is equally valid. -->
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#nonNegativeInteger">2012853</dcat:byteSize>
        <!-- A property element with rdf:resource must be empty in RDF/XML,
             so the IRI is given only in the attribute. -->
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/4021225/files/non-source-items_wooc20.pptx"/>
        <dcat:mediaType>application/vnd.openxmlformats-officedocument.presentationml.presentation</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
66 views
15 downloads
Statistic | All versions | This version
Views | 66 | 66
Downloads | 15 | 15
Data volume | 30.2 MB | 30.2 MB
Unique views | 61 | 61
Unique downloads | 13 | 13

Share

Cite as