Dataset Open Access

ICDAR 2019 Competition on Image Retrieval for Historical Handwritten Documents [HisIR19] Dataset

Christlein, Vincent; Nicolaou, Anguelos; Seuret, Mathias; Stutzmann, Dominique; Maier, Andreas


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.3262372">
    <!-- Core identity of the record: it is typed both as a dcat:Dataset and as a
         DCMI Dataset. The DOI URL that serves as the subject URI of the enclosing
         rdf:Description is repeated here as the dct:identifier value (typed
         xsd:anyURI) and as the foaf:page landing page. -->
    <rdf:type rdf:resource="http://www.w3.org/ns/dcat#Dataset"/>
    <dct:type rdf:resource="http://purl.org/dc/dcmitype/Dataset"/>
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.3262372</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
    <!-- Creators: five foaf:Agent entries, one dct:creator element per person.
         Each carries the full name plus split given/family names and a single
         org:memberOf affiliation. Every affiliation is an anonymous
         foaf:Organization holding only a name, so the repeated
         "Pattern Recognition Lab, FAU" entries are separate nodes, not one
         shared resource. -->
    <!-- Creator 1: identified by an ORCID URI (rdf:about); the bare ORCID is
         repeated as a string-typed dct:identifier. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0003-0455-3799">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-0455-3799</dct:identifier>
        <foaf:name>Christlein, Vincent</foaf:name>
        <foaf:givenName>Vincent</foaf:givenName>
        <foaf:familyName>Christlein</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Pattern Recognition Lab, FAU</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator 2: no rdf:about and no identifier, so this agent is a blank node
         described only by name and affiliation. -->
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Nicolaou, Anguelos</foaf:name>
        <foaf:givenName>Anguelos</foaf:givenName>
        <foaf:familyName>Nicolaou</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Pattern Recognition Lab, FAU</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator 3: blank node (no rdf:about, no identifier). -->
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Seuret, Mathias</foaf:name>
        <foaf:givenName>Mathias</foaf:givenName>
        <foaf:familyName>Seuret</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Pattern Recognition Lab, FAU</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator 4: blank node (no rdf:about, no identifier); the only creator
         whose affiliation name is "IRHT". -->
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Stutzmann, Dominique</foaf:name>
        <foaf:givenName>Dominique</foaf:givenName>
        <foaf:familyName>Stutzmann</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>IRHT</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator 5: identified by an ORCID URI (rdf:about); the bare ORCID is
         repeated as a string-typed dct:identifier. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0002-9550-5284">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-9550-5284</dct:identifier>
        <foaf:name>Maier, Andreas</foaf:name>
        <foaf:givenName>Andreas</foaf:givenName>
        <foaf:familyName>Maier</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Pattern Recognition Lab, FAU</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Descriptive metadata: title, publisher, issue date, keywords, alternate
         identifiers and links to related records. -->
    <dct:title>ICDAR 2019 Competition on Image Retrieval for Historical Handwritten Documents [HisIR19] Dataset</dct:title>
    <!-- The publisher is an anonymous foaf:Agent that carries only a name. -->
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- NOTE(review): dct:issued occurs twice in this record, here as xsd:gYear
         and again below as a full xsd:date. A consumer that expects a single
         value must decide which one to use. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2019</dct:issued>
    <!-- One dcat:keyword element per keyword; plain literals without a language tag. -->
    <dcat:keyword>writer retrieval</dcat:keyword>
    <dcat:keyword>image retrieval</dcat:keyword>
    <dcat:keyword>writer identification</dcat:keyword>
    <dcat:keyword>document analysis</dcat:keyword>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2019-06-30</dct:issued>
    <!-- The Zenodo record URL is stated twice: as an owl:sameAs alias of the DOI
         subject and as an adms:Identifier whose notation is that same URL. -->
    <owl:sameAs rdf:resource="https://zenodo.org/record/3262372"/>
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/3262372</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <!-- Links to other DOIs. The dct:isVersionOf target (…3262371) differs from
         this record's own DOI (…3262372); presumably it is the DOI that covers
         all versions. TODO confirm. -->
    <dct:relation rdf:resource="https://doi.org/10.5281/zenodo.1324999"/>
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.3262371"/>
    <owl:versionInfo>1.0</owl:versionInfo>
    <!-- The description is HTML stored as entity-escaped text in a plain literal:
         paragraph and line-break tags arrive as escaped markup, and the
         non-breaking-space and quote entities are escaped a second time so they
         survive as HTML entities after XML parsing. Consumers must render or
         strip the HTML themselves. -->
    <dct:description>&lt;p&gt;This dataset contains the training and test set used in the ICDAR 2019 Competition on Image Retrieval for Historical Handwritten Documents.&lt;/p&gt; &lt;p&gt;This competition investigates the performance of large-scale retrieval of historical document images based on&lt;br&gt; writing style. Based on large image data sets provided by cultural heritage institutions and digital libraries, providing&lt;br&gt; a total of 20 000 document images representing about 10 000 writers, divided in three types: writers of (i) manuscript books, (ii) letters, (iii) charters and legal documents. We focus on the task of automatic image retrieval to simulate common scenarios of humanities research, such as writer retrieval.&lt;/p&gt; &lt;p&gt;The training data set encompasses images from (i) Letters A, where each writer contributed one or three images; (ii) Manuscripts, where each writer was represented by five consecutive images from a single book.&lt;br&gt; In total, it contains 300 writers contributing one page, 100 writers contributing three pages, and 120 writers contributing five pages resulting in 1200 images of 520 writers.&lt;/p&gt; &lt;p&gt;The test data set contains 20 000 images: About 7 500 pages stem from isolated documents (partially anonymous writers, contributing one page each), and about 12 500 pages are from writers that contributed three or five pages.&lt;/p&gt; &lt;p&gt;&amp;nbsp;&lt;/p&gt; &lt;p&gt;If you use this dataset, please cite:&lt;/p&gt; &lt;p&gt;V. Christlein, A. Nicolaou, M. Seuret, D. Stutzmann, A. Maier: &amp;quot;ICDAR 2019 Competition on Image Retrieval for Historical Handwritten Documents&amp;quot;, in 15th International Conference on Document Analysis and Recognition, 2019, Sydney, Australia&lt;/p&gt; &lt;p&gt;&amp;nbsp;&lt;/p&gt;</dct:description>
    <!-- Access rights are stated twice, under two different URIs: the EU
         Publications Office access-right authority value PUBLIC, and an
         info:eu-repo openAccess rights statement labelled "Open Access". -->
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <!-- Distribution that carries the licence (CC BY-NC-SA 4.0 legal code). It
         names no file: there is only an access URL pointing at the record DOI,
         and no download URL, size or media type. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dct:license rdf:resource="https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode"/>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- Per-file distributions: one anonymous dcat:Distribution per downloadable
         file, each with the record DOI as access URL, the size in bytes, the
         direct download URL and the media type.
         The access and download URLs are given only through rdf:resource and the
         property elements are left empty. RDF/XML does not allow a property
         element to combine rdf:resource with text content, so repeating the URL
         as element text made the export unparseable for strict RDF parsers.
         NOTE(review): dcat:byteSize is emitted as a plain literal; DCAT defines
         a numeric datatype for it. Confirm whether consumers need
         rdf:datatype here. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>1156</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/README.txt"/>
        <dcat:mediaType>text/plain</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>2597101</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/test_meta.csv"/>
        <dcat:mediaType>text/csv</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>188886</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/val_meta.csv"/>
        <dcat:mediaType>text/csv</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>26182765342</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/wi_comp_19_test_full.zip"/>
        <dcat:mediaType>application/zip</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>485223</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/wi_comp19_test_ground_truth.csv"/>
        <dcat:mediaType>text/csv</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>18202</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/wi_comp_19val_ground_truth.csv"/>
        <dcat:mediaType>text/csv</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3262372"/>
        <dcat:byteSize>2775958128</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3262372/files/wi_comp_19_validation.zip"/>
        <dcat:mediaType>application/zip</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
1,038 views
722 downloads
Statistic | All versions | This version
Views | 1,038 | 1,039
Downloads | 722 | 721
Data volume | 5.4 TB | 5.4 TB
Unique views | 941 | 942
Unique downloads | 332 | 331

Share

Cite as