Dataset Open Access

Statistics and Evaluation Data for Publication "Using Supervised Learning to Classify Metadata of Research Data by Discipline of Research"

Tobias Weber; Michael Fromm; Nelson Tavares de Sousa


DataCite XML Export

<?xml version='1.0' encoding='utf-8'?>
<!-- DataCite metadata record (kernel-4 namespace; the schema location hint
     points at the kernel-4.1 XSD) for the dataset identified by the DOI in
     the identifier element below. -->
<resource xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://datacite.org/schema/kernel-4" xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.1/metadata.xsd">
  <identifier identifierType="DOI">10.5281/zenodo.3490468</identifier>
  <!-- Three creators; each carries an ORCID name identifier and a single
       affiliation. -->
  <creators>
    <creator>
      <creatorName>Tobias Weber</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0003-1815-7041</nameIdentifier>
      <affiliation>Leibniz Supercomputing Centre</affiliation>
    </creator>
    <creator>
      <creatorName>Michael Fromm</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0002-7244-4191</nameIdentifier>
      <affiliation>Database Systems Group, Ludwig-Maximilians-Universität München</affiliation>
    </creator>
    <creator>
      <creatorName>Nelson Tavares de Sousa</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0003-1866-7156</nameIdentifier>
      <affiliation>Software Engineering Group, Kiel University</affiliation>
    </creator>
  </creators>
  <titles>
    <title>Statistics and Evaluation Data for Publication "Using Supervised Learning to Classify Metadata of Research Data by Discipline of Research"</title>
  </titles>
  <publisher>Zenodo</publisher>
  <publicationYear>2019</publicationYear>
  <!-- Six free-text keywords, followed by two subjects tagged with
       subjectScheme="url". -->
  <subjects>
    <subject>supervised machine learning</subject>
    <subject>multi-label classification</subject>
    <subject>research data</subject>
    <subject>text processing</subject>
    <subject>data science</subject>
    <subject>disciplines of research</subject>
    <!-- NOTE(review): the two entries below are byte-identical and contain
         only the base URL; possibly two distinct classification URIs were
         truncated on export. Confirm against the original deposit. -->
    <subject subjectScheme="url">https://dewey.info/</subject>
    <subject subjectScheme="url">https://dewey.info/</subject>
  </subjects>
  <dates>
    <date dateType="Issued">2019-10-15</date>
  </dates>
  <!-- Only the general resource type is set; the element has no text value. -->
  <resourceType resourceTypeGeneral="Dataset"/>
  <alternateIdentifiers>
    <alternateIdentifier alternateIdentifierType="url">https://zenodo.org/record/3490468</alternateIdentifier>
  </alternateIdentifiers>
  <!-- Relations: this record is declared a version of DOI
       10.5281/zenodo.3490467 (presumably the DOI covering all versions;
       verify) and part of the Zenodo community URL. -->
  <relatedIdentifiers>
    <relatedIdentifier relatedIdentifierType="DOI" relationType="IsVersionOf">10.5281/zenodo.3490467</relatedIdentifier>
    <relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://zenodo.org/communities/zenodo</relatedIdentifier>
  </relatedIdentifiers>
  <!-- Two rights statements: the licence (CC BY 4.0 legal code URI) and the
       access level (open access). -->
  <rightsList>
    <rights rightsURI="http://creativecommons.org/licenses/by/4.0/legalcode">Creative Commons Attribution 4.0 International</rights>
    <rights rightsURI="info:eu-repo/semantics/openAccess">Open Access</rights>
  </rightsList>
  <!-- The abstract text is wrapped in entity-escaped HTML paragraph tags, so
       consumers receive markup as literal text and must unescape or strip it
       if plain text is wanted. -->
  <descriptions>
    <description descriptionType="Abstract">&lt;p&gt;Automated classification of metadata of research data by their discipline(s) of research can be used in scientometric research, by repository service providers, and in the context of research data aggregation services. Openly available metadata of the DataCite index for research data were used to compile a large training and evaluation set comprised of 609,524 records. This publication contains aggregated data for the paper. It also contains the evaluation data of all model/hyper-parameter training and test runs.&lt;/p&gt;</description>
  </descriptions>
</resource>
544 views
77 downloads
Metric | All versions | This version
Views | 544 | 544
Downloads | 77 | 78
Data volume | 7.0 MB | 7.1 MB
Unique views | 432 | 432
Unique downloads | 73 | 74

Share

Cite as