{ "access": { "embargo": { "active": false, "reason": null }, "files": "public", "record": "public", "status": "open" }, "created": "2022-07-18T18:35:52.260204+00:00", "custom_fields": { "meeting:meeting": { "acronym": "DAS", "dates": "22-25 May 2022", "title": "15th IAPR International Workshop on Document Analysis System", "url": "https://das2022.univ-lr.fr/index.php/important-dates/" } }, "deletion_status": { "is_deleted": false, "status": "P" }, "files": { "count": 1, "enabled": true, "entries": { "VMP_HP_ext_v2.zip": { "checksum": "md5:c9114f5e91db7793ba602db7ed53c2c9", "ext": "zip", "id": "fdcc3ab9-43ba-4d82-a3a2-99a6434565e8", "key": "VMP_HP_ext_v2.zip", "metadata": null, "mimetype": "application/zip", "size": 2152473175 } }, "order": [], "total_bytes": 2152473175 }, "id": "6856934", "is_draft": false, "is_published": true, "links": { "access": "https://zenodo.org/api/records/6856934/access", "access_links": "https://zenodo.org/api/records/6856934/access/links", "access_request": "https://zenodo.org/api/records/6856934/access/request", "access_users": "https://zenodo.org/api/records/6856934/access/users", "archive": "https://zenodo.org/api/records/6856934/files-archive", "archive_media": "https://zenodo.org/api/records/6856934/media-files-archive", "communities": "https://zenodo.org/api/records/6856934/communities", "communities-suggestions": "https://zenodo.org/api/records/6856934/communities-suggestions", "doi": "https://doi.org/10.5281/zenodo.6856934", "draft": "https://zenodo.org/api/records/6856934/draft", "files": "https://zenodo.org/api/records/6856934/files", "latest": "https://zenodo.org/api/records/6856934/versions/latest", "latest_html": "https://zenodo.org/records/6856934/latest", "media_files": "https://zenodo.org/api/records/6856934/media-files", "parent": "https://zenodo.org/api/records/6387470", "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.6387470", "parent_html": "https://zenodo.org/records/6387470", "requests": 
"https://zenodo.org/api/records/6856934/requests", "reserve_doi": "https://zenodo.org/api/records/6856934/draft/pids/doi", "self": "https://zenodo.org/api/records/6856934", "self_doi": "https://zenodo.org/doi/10.5281/zenodo.6856934", "self_html": "https://zenodo.org/records/6856934", "self_iiif_manifest": "https://zenodo.org/api/iiif/record:6856934/manifest", "self_iiif_sequence": "https://zenodo.org/api/iiif/record:6856934/sequence/default", "versions": "https://zenodo.org/api/records/6856934/versions" }, "media_files": { "count": 0, "enabled": false, "entries": {}, "order": [], "total_bytes": 0 }, "metadata": { "additional_descriptions": [ { "description": "For more details, please refer to [1].\n\nWhen using this dataset in research work, please cite [1].\n\n \n\n[1] A.Droby, D. Vasyutinsky Shapira, I. Rabaev, B. Kurar Barakat, and J. El-Sana. Hard and Soft Labeling for Hebrew Paleography: A Case Study. Accepted to the 15th IAPR International Workshop on Document Analysis System (https://das2022.univ-lr.fr/index.php/)", "type": { "id": "notes", "title": { "de": "Anmerkungen", "en": "Notes" } } } ], "creators": [ { "affiliations": [ { "name": "Ben-Gurion University of the Negev, Beer-Sheva, Israel" } ], "person_or_org": { "family_name": "Ahmad Droby", "identifiers": [ { "identifier": "0000-0001-8458-1022", "scheme": "orcid" } ], "name": "Ahmad Droby", "type": "personal" } }, { "affiliations": [ { "name": "Ben-Gurion University of the Negev, Beer-Sheva, Israel" } ], "person_or_org": { "family_name": "Daria Vasyutinsky Shapira", "identifiers": [ { "identifier": "0000-0002-7240-7286", "scheme": "orcid" } ], "name": "Daria Vasyutinsky Shapira", "type": "personal" } }, { "affiliations": [ { "name": "Shamoon College of Engineering, Beer Sheva, 84100, Israel" } ], "person_or_org": { "family_name": "Irina Rabaev", "identifiers": [ { "identifier": "0000-0002-8542-8342", "scheme": "orcid" } ], "name": "Irina Rabaev", "type": "personal" } }, { "affiliations": [ { "name": 
"Ben-Gurion University of the Negev, Beer-Sheva, Israel" } ], "person_or_org": { "family_name": "Berat Kurar Bakarat", "identifiers": [ { "identifier": "0000-0002-7240-7286", "scheme": "orcid" } ], "name": "Berat Kurar Bakarat", "type": "personal" } }, { "affiliations": [ { "name": "Ben-Gurion University of the Negev, Beer-Sheva, Israel" } ], "person_or_org": { "family_name": "Jihad El-Sana", "identifiers": [ { "identifier": "0000-0002-1164-7040", "scheme": "orcid" } ], "name": "Jihad El-Sana", "type": "personal" } } ], "description": "
The VML-HP-ext collection contains 715 page images excerpted from 171 different manuscripts covering 14 medieval Hebrew writing styles, accompanied by their hard and soft ground-truth (GT) labels.
\n\n We also provide the official split of the VML-HP-ext into training, typical test, and blind test sets.
\nThe typical test set includes unseen pages of the manuscripts from the training set. While training and typical test sets are disjoint on the page level, they do share the same set of manuscripts. Therefore, we also provide the blind test set, which consists of manuscripts that do not appear in the training set. The blind test set imitates a real-life scenario, where scholars would like to obtain a classification for a previously unseen document.
In this version, several labels were corrected.
", "publication_date": "2022-03-27", "publisher": "Zenodo", "resource_type": { "id": "dataset", "title": { "de": "Datensatz", "en": "Dataset" } }, "rights": [ { "description": { "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited." }, "icon": "cc-by-icon", "id": "cc-by-4.0", "props": { "scheme": "spdx", "url": "https://creativecommons.org/licenses/by/4.0/legalcode" }, "title": { "en": "Creative Commons Attribution 4.0 International" } } ], "subjects": [ { "subject": "Medieval Hebrew Manuscripts" }, { "subject": "Script Type Classification" }, { "subject": "Digital Paleography" }, { "subject": "Hard And Soft-labeling" } ], "title": "VMP_HP-ext_2" }, "parent": { "access": { "owned_by": { "user": 84438 } }, "communities": {}, "id": "6387470", "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.6387470", "provider": "datacite" } } }, "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.6856934", "provider": "datacite" }, "oai": { "identifier": "oai:zenodo.org:6856934", "provider": "oai" } }, "revision_id": 2, "stats": { "all_versions": { "data_volume": 83851136335.0, "downloads": 39, "unique_downloads": 33, "unique_views": 533, "views": 551 }, "this_version": { "data_volume": 43049463500.0, "downloads": 20, "unique_downloads": 15, "unique_views": 244, "views": 246 } }, "status": "published", "updated": "2022-07-19T01:49:54.564452+00:00", "versions": { "index": 2, "is_latest": true } }