Dataset Open Access

PAN Plagiarism Corpus 2010 (PAN-PC-10)

Potthast, Martin; Stein, Benno; Eiselt, Andreas; Barrón-Cedeño, Alberto; Rosso, Paolo


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.3250123">
    <!-- Typing and identification of the described resource: it is declared a
         dcat:Dataset (and a DCMI-type Dataset), carries its DOI URL as an
         anyURI-typed identifier, and points to the same DOI URL as its page. -->
    <rdf:type rdf:resource="http://www.w3.org/ns/dcat#Dataset"/>
    <dct:type rdf:resource="http://purl.org/dc/dcmitype/Dataset"/>
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.3250123</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.3250123"/>
    <!-- Creator: Martin Potthast, identified by an ORCID URI and affiliated
         with Bauhaus-Universität Weimar. -->
    <dct:creator>
      <!-- Typed-node form: states the same rdf:type (foaf:Agent) as an
           rdf:Description with an explicit rdf:type child would. -->
      <foaf:Agent rdf:about="http://orcid.org/0000-0003-2451-0665">
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-2451-0665</dct:identifier>
        <foaf:name>Potthast, Martin</foaf:name>
        <foaf:givenName>Martin</foaf:givenName>
        <foaf:familyName>Potthast</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Bauhaus-Universität Weimar</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </foaf:Agent>
    </dct:creator>
    <!-- Creator: Benno Stein, identified by an ORCID URI and affiliated
         with Bauhaus-Universität Weimar. -->
    <dct:creator>
      <!-- Typed-node form: states the same rdf:type (foaf:Agent) as an
           rdf:Description with an explicit rdf:type child would. -->
      <foaf:Agent rdf:about="http://orcid.org/0000-0001-9033-2217">
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0001-9033-2217</dct:identifier>
        <foaf:name>Stein, Benno</foaf:name>
        <foaf:givenName>Benno</foaf:givenName>
        <foaf:familyName>Stein</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Bauhaus-Universität Weimar</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </foaf:Agent>
    </dct:creator>
    <!-- Creator: Andreas Eiselt, affiliated with Bauhaus-Universität Weimar.
         No identifier is given, so the agent is an anonymous (blank) node. -->
    <dct:creator>
      <!-- Typed-node form: states the same rdf:type (foaf:Agent) as an
           rdf:Description with an explicit rdf:type child would. -->
      <foaf:Agent>
        <foaf:name>Eiselt, Andreas</foaf:name>
        <foaf:givenName>Andreas</foaf:givenName>
        <foaf:familyName>Eiselt</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Bauhaus-Universität Weimar</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </foaf:Agent>
    </dct:creator>
    <!-- Creator: Alberto Barrón-Cedeño, affiliated with Universidad
         Politécnica de Valencia. No identifier is given, so the agent is an
         anonymous (blank) node. -->
    <dct:creator>
      <!-- Typed-node form: states the same rdf:type (foaf:Agent) as an
           rdf:Description with an explicit rdf:type child would. -->
      <foaf:Agent>
        <foaf:name>Barrón-Cedeño, Alberto</foaf:name>
        <foaf:givenName>Alberto</foaf:givenName>
        <foaf:familyName>Barrón-Cedeño</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <!-- Spanish spelling of the institution name ("Politécnica"). -->
            <foaf:name>Universidad Politécnica de Valencia</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </foaf:Agent>
    </dct:creator>
    <!-- Creator: Paolo Rosso, affiliated with Universidad Politécnica de
         Valencia. No identifier is given, so the agent is an anonymous
         (blank) node. -->
    <dct:creator>
      <!-- Typed-node form: states the same rdf:type (foaf:Agent) as an
           rdf:Description with an explicit rdf:type child would. -->
      <foaf:Agent>
        <foaf:name>Rosso, Paolo</foaf:name>
        <foaf:givenName>Paolo</foaf:givenName>
        <foaf:familyName>Rosso</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <!-- Spanish spelling of the institution name ("Politécnica"). -->
            <foaf:name>Universidad Politécnica de Valencia</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </foaf:Agent>
    </dct:creator>
    <!-- Descriptive metadata: title, publisher, release dates, language,
         keywords and the equivalent Zenodo record URL. Statement order carries
         no meaning in RDF; related statements are simply kept together. -->
    <dct:title>PAN Plagiarism Corpus 2010 (PAN-PC-10)</dct:title>
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- Two release-date statements: a year-only value and a full calendar date.
         NOTE(review): application profiles such as DCAT-AP expect at most one
         dct:issued per dataset; confirm whether consumers need both values. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2010</dct:issued>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2010-05-01</dct:issued>
    <dct:language rdf:resource="http://publications.europa.eu/resource/authority/language/ENG"/>
    <dcat:keyword>plagiarism</dcat:keyword>
    <dcat:keyword>plagiarism detection</dcat:keyword>
    <dcat:keyword>documents</dcat:keyword>
    <dcat:keyword>PAN</dcat:keyword>
    <dcat:keyword>2010</dcat:keyword>
    <owl:sameAs rdf:resource="https://zenodo.org/record/3250123"/>
    <!-- Additional identifier: the Zenodo record URL, given as an anyURI-typed
         notation with the scheme agency "url". -->
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/3250123</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <!-- Versioning: this record is a version of the resource with DOI
         10.5281/zenodo.3250122. -->
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.3250122"/>
    <!-- Containment: the record is part of the "pan" and "webis" collections
         under zenodo.org/communities. -->
    <dct:isPartOf rdf:resource="https://zenodo.org/communities/pan"/>
    <dct:isPartOf rdf:resource="https://zenodo.org/communities/webis"/>
    <!-- Human-readable description. The literal is XML-escaped HTML (paragraph
         markup plus an HTML character reference for the apostrophe), so a
         consumer gets HTML source text after XML parsing, not plain text. -->
    <dct:description>&lt;p&gt;This corpus is outdated. Please use its successor PAN-PC-11: https://doi.org/10.5281/zenodo.3250095&lt;/p&gt; &lt;p&gt;The PAN plagiarism corpus 2010 (PAN-PC-10) is a corpus for the evaluation of automatic plagiarism detection algorithms. For research purposes the corpus can be used free of charge.&lt;/p&gt; &lt;p&gt;The PAN-PC-10 contains documents in which artificial plagiarism has been inserted automatically as well as documents in which simulated plagiarism has been inserted manually. The former have been constructed using a so-called random plagiarist, a computer program which constructs plagiarism according to a number of parameters, while the latter have been obtained with crowdsourcing via Amazon&amp;#39;s Mechanical Turk.&lt;/p&gt;</dct:description>
    <!-- Second description: a JSON object whose "references" array holds one
         bibliographic citation, with non-ASCII characters as JSON \u escapes.
         NOTE(review): structured JSON inside dct:description is opaque to RDF
         consumers; a dedicated citation property may be more appropriate.
         Confirm against the exporter before changing. -->
    <dct:description>{"references": ["Alberto Barr\u00f3n-Cede\u00f1o, Martin Potthast, Paolo Rosso, Benno Stein, and Andreas Eiselt. Corpus and Evaluation Measures for Automatic Plagiarism Detection. In Nicoletta Calzolari et al, editors, 7th Conference on International Language Resources and Evaluation (LREC 10), May 2010. European Language Resources Association (ELRA). ISBN 2-9517408-6-7."]}</dct:description>
    <!-- Access rights are stated twice: once as a reference to the EU
         Publications Office access-right authority entry "PUBLIC", and once as
         an info:eu-repo openAccess rights statement labelled "Open Access". -->
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <!-- Distribution carrying the licence: reachable via the DOI URL and
         licensed under the Creative Commons BY 4.0 legal code. It has no
         download URL or size of its own. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3250123"/>
        <dct:license rdf:resource="https://creativecommons.org/licenses/by/4.0/legalcode"/>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- Distribution for the first archive part (part1.rar): reachable via the
         DOI URL, with its size in bytes and a direct download link. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3250123"/>
        <!-- The size is given an explicit numeric datatype so consumers read
             it as a number rather than as a plain string literal. -->
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#nonNegativeInteger">1073741824</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3250123/files/pan-plagiarism-corpus-2010.part1.rar"/>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- Distribution for the second archive part (part2.rar): reachable via the
         DOI URL, with its size in bytes and a direct download link. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3250123"/>
        <!-- The size is given an explicit numeric datatype so consumers read
             it as a number rather than as a plain string literal. -->
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#nonNegativeInteger">700199388</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3250123/files/pan-plagiarism-corpus-2010.part2.rar"/>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
624
426
views
downloads
Statistic: All versions / This version
Views: 624 / 625
Downloads: 426 / 426
Data volume: 388.3 GB / 388.3 GB
Unique views: 570 / 571
Unique downloads: 191 / 191

Share

Cite as