Dataset Open Access

Extracted Illustrations of the Berlin State Library's Digitized Collections (part 3 of 4)

Zellhöfer, David


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.2598261">
    <!-- Core typing and identification of the record: it is declared both a
         dcat:Dataset and a DCMI "Dataset" type, and the same DOI URL is used
         as the dct:identifier value (typed xsd:anyURI) and as the foaf:page. -->
    <rdf:type rdf:resource="http://www.w3.org/ns/dcat#Dataset"/>
    <dct:type rdf:resource="http://purl.org/dc/dcmitype/Dataset"/>
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.2598261</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.2598261"/>
    <!-- Creator of the dataset. The agent node is identified by the ORCID URI
         and written as a typed node element (foaf:Agent), which states the
         same rdf:type triple as an rdf:Description with an explicit rdf:type
         child. -->
    <dct:creator>
      <foaf:Agent rdf:about="http://orcid.org/0000-0002-0403-457X">
        <!-- Bare ORCID iD as a string identifier, alongside the URI above. -->
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-0403-457X</dct:identifier>
        <!-- Name in "family, given" form, followed by its separate parts. -->
        <foaf:name>Zellhöfer, David</foaf:name>
        <foaf:givenName>David</foaf:givenName>
        <foaf:familyName>Zellhöfer</foaf:familyName>
        <!-- Affiliation: an anonymous organization node carrying only a name. -->
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Berlin State Library</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </foaf:Agent>
    </dct:creator>
    <!-- Human-readable title of this part of the dataset. -->
    <dct:title>Extracted Illustrations of the Berlin State Library's Digitized Collections (part 3 of 4)</dct:title>
    <!-- Publisher is an anonymous foaf:Agent carrying only a name. -->
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- dct:issued is stated twice in this record: here as a bare year
         (xsd:gYear) and again after the keywords as a full xsd:date. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2019</dct:issued>
    <!-- Free-text keywords, one dcat:keyword element per term. -->
    <dcat:keyword>digital library</dcat:keyword>
    <dcat:keyword>digitized content</dcat:keyword>
    <dcat:keyword>CBIR</dcat:keyword>
    <dcat:keyword>image segments</dcat:keyword>
    <dcat:keyword>illustrations</dcat:keyword>
    <dcat:keyword>historical books</dcat:keyword>
    <dcat:keyword>JPEG</dcat:keyword>
    <!-- Second dct:issued statement: the full issue date. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2019-03-19</dct:issued>
    <!-- The DOI-identified resource is declared identical to the zenodo.org record URL. -->
    <owl:sameAs rdf:resource="https://zenodo.org/record/2598261"/>
    <!-- Alternative identifier: the zenodo.org record URL as an
         adms:Identifier whose skos:notation is typed xsd:anyURI. -->
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/2598261</skos:notation>
        <!-- NOTE(review): "url" reads like the identifier scheme rather than
             the name of an issuing agency; confirm this is the intended use
             of adms:schemeAgency. -->
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <!-- Relations and versioning. dct:isVersionOf points at DOI
         10.5281/zenodo.2598260 (presumably the version-independent DOI of
         this record; TODO confirm). dct:isPartOf links the Zenodo community
         "stabi". owl:versionInfo carries the version label. -->
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.2598260"/>
    <dct:isPartOf rdf:resource="https://zenodo.org/communities/stabi"/>
    <owl:versionInfo>1.0</owl:versionInfo>
    <!-- Description literal. Its value is entity-escaped HTML (p, strong, pre
         and a elements), so consumers receive markup as text and must decode
         or strip it themselves. The "part 3 of 4" notice with the reference
         DOI appears both at the start and at the end of the text. -->
    <dct:description>&lt;p&gt;&lt;strong&gt;This is part 3 of 4. The following dataset contains a reference the other ZIP files: &lt;/strong&gt;&lt;/p&gt; &lt;pre&gt;https://doi.org/10.5281/zenodo.2598101&lt;/pre&gt; &lt;p&gt;The dataset consists of various illustrations extracted from 26,233 historical books and other media offered in the Berlin State Library&amp;#39;s Digitized Collections. The media objects are older than 1920.&lt;/p&gt; &lt;p&gt;Version 1.0 contains of 594,890 extracted illustrations in total.&lt;/p&gt; &lt;p&gt;The extraction of illustrations is driven by the coordinates given by the ABBYY FineReader OCR engine (in ALTO XML) . The extracted illustrations have not been resized but compressed and saved in JPEG format.&lt;/p&gt; &lt;p&gt;Pre-trained models in order to separate color scales, hand-written signatures, library stamps or the like from interesting content are available under: &lt;a href="https://github.com/elektrobohemian/imi-unicorns"&gt;https://github.com/elektrobohemian/imi-unicorns&lt;/a&gt;.&lt;/p&gt; &lt;p&gt;The extracts for each media object are stored in separated sub-folders and tar files named after the PPN (a unique ID used in the library) to facilitate further processing. Additional metadata can be obtained with help of the PPN as described here: &lt;a href="https://github.com/elektrobohemian/StabiHacks/blob/master/ppn-howto.md"&gt;https://github.com/elektrobohemian/StabiHacks/blob/master/ppn-howto.md&lt;/a&gt; .&lt;/p&gt; &lt;p&gt;The dataset is published as a set of ZIP files, each fitting on a Blu Ray disc. &lt;strong&gt;After decompression, the contents will consume ca. 166 GB.&lt;/strong&gt;&lt;/p&gt; &lt;p&gt;&lt;strong&gt;This is part 3 of 4. The following dataset contains a reference the other ZIP files: &lt;/strong&gt;&lt;/p&gt; &lt;pre&gt;https://doi.org/10.5281/zenodo.2598101&lt;/pre&gt;</dct:description>
    <!-- Access rights are stated twice: once as a reference to the PUBLIC
         entry of the publications.europa.eu access-right authority list, and
         once as a dct:RightsStatement identified by
         info:eu-repo/semantics/openAccess with the label "Open Access". -->
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <!-- Distribution that carries the licence: the CC BY 4.0 legal code URL,
         with the DOI as access URL. It has no download URL or byte size. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dct:license rdf:resource="https://creativecommons.org/licenses/by/4.0/legalcode"/>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.2598261"/>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- File-level distributions, one per downloadable file of this record
         (extracted_images.zip.005 and extracted_images.zip.006). Each shares
         the DOI as access URL and adds a direct download URL and a size. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.2598261"/>
        <!-- Size in bytes. Typed as xsd:decimal, the range DCAT defines for
             dcat:byteSize, rather than left as an untyped plain literal. -->
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#decimal">24159191040</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/2598261/files/extracted_images.zip.005"/>
      </dcat:Distribution>
    </dcat:distribution>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.2598261"/>
        <!-- Size in bytes, typed as xsd:decimal (see the first file entry's rationale: DCAT range of dcat:byteSize). -->
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#decimal">24159191040</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/2598261/files/extracted_images.zip.006"/>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
47
63
views
downloads
All versions This version
Views 4747
Downloads 6363
Data volume 1.5 TB1.5 TB
Unique views 4545
Unique downloads 3434

Share

Cite as