Dataset Open Access

DiscoWUG: Discovered Diachronic Word Usage Graphs for German

Kurtyigit, Sinan; Park, Maike; Schlechtweg, Dominik; Kuhn, Jonas; Schulte im Walde, Sabine


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<record xmlns="http://www.loc.gov/MARC21/slim">
  <!-- MARC21 (slim) export of the dataset record
       "DiscoWUG: Discovered Diachronic Word Usage Graphs for German". -->
  <!-- NOTE(review): the leader uses '#' in positions where MARC blanks are
       normally written as spaces; left unchanged here. Confirm that downstream
       consumers expect this form. -->
  <leader>00000nmm##2200000uu#4500</leader>
  <!-- Control fields are grouped directly after the leader and ahead of all
       data fields, which is the element order the MARC21 slim schema expects. -->
  <controlfield tag="001">5791125</controlfield>
  <controlfield tag="005">20211219014845.0</controlfield>
  <!-- Data fields follow, in the same relative order as the original export. -->
  <datafield tag="041" ind1=" " ind2=" ">
    <subfield code="a">deu</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">graded word meaning annotation</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">word usage graphs</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">diachronic usage relatedness</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">semantic change</subfield>
  </datafield>
  <datafield tag="500" ind1=" " ind2=" ">
    <subfield code="a">additional DURel metrics and change scores</subfield>
  </datafield>
  <!-- Additional authors (the first author is carried in field 100 below). -->
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Leibniz-Institut für Deutsche Sprache</subfield>
    <subfield code="0">(orcid)0000-0001-8582-1462</subfield>
    <subfield code="a">Park, Maike</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">University of Stuttgart</subfield>
    <subfield code="0">(orcid)0000-0002-0685-2576</subfield>
    <subfield code="a">Schlechtweg, Dominik</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">University of Stuttgart</subfield>
    <subfield code="a">Kuhn, Jonas</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">University of Stuttgart</subfield>
    <subfield code="0">(orcid)0000-0002-8975-6255</subfield>
    <subfield code="a">Schulte im Walde, Sabine</subfield>
  </datafield>
  <!-- Downloadable file: size in bytes ($s), checksum ($z) and URL ($u). -->
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">15022804</subfield>
    <subfield code="z">md5:63d56739e306f68434c3cd015d2b8248</subfield>
    <subfield code="u">https://zenodo.org/record/5791125/files/discowug.zip</subfield>
  </datafield>
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2021-12-15</subfield>
  </datafield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire_data</subfield>
    <subfield code="p">user-historical_linguistics</subfield>
    <subfield code="p">user-wugs</subfield>
    <subfield code="o">oai:zenodo.org:5791125</subfield>
  </datafield>
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">University of Stuttgart</subfield>
    <subfield code="a">Kurtyigit, Sinan</subfield>
  </datafield>
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">DiscoWUG: Discovered Diachronic Word Usage Graphs for German</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-historical_linguistics</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-wugs</subfield>
  </datafield>
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">https://creativecommons.org/licenses/by/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution 4.0 International</subfield>
  </datafield>
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <!-- Description: entity-escaped HTML stored as text. Whitespace inside this
       subfield is part of the value, so it is not re-indented. -->
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;This data collection contains discovered diachronic Word Usage Graphs (WUGs) for German. Find a description of the data format, code to process the data and further datasets on the &lt;a href="https://www.ims.uni-stuttgart.de/data/wugs"&gt;WUGsite&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;Note:&lt;/p&gt;

&lt;ul&gt;
	&lt;li&gt;The date given for each word use does not correspond to the exact date of the document from which the use was sampled but only to the midpoint of the respective time period (1800-1899, 1946-1990), as the exact date was not available in the SemEval corpora.&lt;/li&gt;
&lt;/ul&gt;

&lt;p&gt;Please find more information on the provided data in the paper referenced below.&lt;/p&gt;

&lt;p&gt;Version: 1.1.0, 15.12.2021.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Reference&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;Sinan Kurtyigit, Maike Park, Dominik Schlechtweg, Jonas Kuhn, Sabine Schulte im Walde. 2021. &lt;a href="https://arxiv.org/abs/2106.03111"&gt;Lexical Semantic Change Discovery&lt;/a&gt;. Proceedings of the Joint Conference of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing.&lt;/p&gt;</subfield>
  </datafield>
  <!-- Related identifiers: scheme ($n), relation type ($i), identifier ($a). -->
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isPublishedIn</subfield>
    <subfield code="a">10.18653/v1/2021.acl-long.543</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">continues</subfield>
    <subfield code="a">10.5281/zenodo.5541274</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">continues</subfield>
    <subfield code="a">10.5281/zenodo.5544198</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="a">10.5281/zenodo.5544579</subfield>
  </datafield>
  <!-- DOI of this record. -->
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.5791125</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">dataset</subfield>
  </datafield>
</record>
143 views
14 downloads
Statistic | All versions | This version
Views | 143 | 61
Downloads | 14 | 6
Data volume | 210.2 MB | 90.1 MB
Unique views | 126 | 54
Unique downloads | 14 | 6

Share

Cite as