Dataset Open Access

Webis Abstractive Snippet Corpus 2020

Chen, Wei-Fan; Syed, Shahbaz; Potthast, Martin; Hagen, Matthias; Stein, Benno


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<!-- MARC21 "slim" XML export of record 3653834: Webis Abstractive Snippet Corpus 2020. -->
<record xmlns="http://www.loc.gov/MARC21/slim">
  <leader>00000nmm##2200000uu#4500</leader>
  <datafield tag="041" ind1=" " ind2=" ">
    <subfield code="a">eng</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">abstractive snippet</subfield>
  </datafield>
  <controlfield tag="005">20200302151041.0</controlfield>
  <controlfield tag="001">3653834</controlfield>
  <!-- Associated conference: name, acronym, dates and place. -->
  <datafield tag="711" ind1=" " ind2=" ">
    <subfield code="d">20-24 April, 2020</subfield>
    <subfield code="g">WWW20</subfield>
    <subfield code="a">The Web Conference 2020</subfield>
    <subfield code="c">Taipei, Taiwan</subfield>
  </datafield>
  <!-- Further authors, written "Surname, Forename"; code "u" holds the institution
       and code "0" the ORCID iD where one is given. -->
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Leipzig University</subfield>
    <subfield code="a">Syed, Shahbaz</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Leipzig University</subfield>
    <subfield code="0">(orcid)0000-0003-2451-0665</subfield>
    <subfield code="a">Potthast, Martin</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Martin-Luther-Universität Halle-Wittenberg</subfield>
    <subfield code="0">(orcid)0000-0002-9733-2890</subfield>
    <subfield code="a">Hagen, Matthias</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Bauhaus-Universität Weimar</subfield>
    <subfield code="0">(orcid)0000-0001-9033-2217</subfield>
    <subfield code="a">Stein, Benno</subfield>
  </datafield>
  <!-- Downloadable files: code "u" is the URL and code "z" the MD5 checksum.
       Code "s" is presumably the file size in bytes (TODO confirm against the exporter). -->
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">4252964846</subfield>
    <subfield code="z">md5:41696d93df837a53f871c0e402eb0a22</subfield>
    <subfield code="u">https://zenodo.org/record/3653834/files/released-snippet-ac-qb.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">6631607911</subfield>
    <subfield code="z">md5:f36a9c50a117d5bee91831b4a23c7bb0</subfield>
    <subfield code="u">https://zenodo.org/record/3653834/files/released-snippet-ac.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">23224318</subfield>
    <subfield code="z">md5:ed30087f82080000ac5e67b23a8d8c98</subfield>
    <subfield code="u">https://zenodo.org/record/3653834/files/released-snippet-dmoz-qb.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">244438672</subfield>
    <subfield code="z">md5:511694a7c9e4794364eaff89838e0039</subfield>
    <subfield code="u">https://zenodo.org/record/3653834/files/released-snippet-dmoz.zip</subfield>
  </datafield>
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2020-02-07</subfield>
  </datafield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire_data</subfield>
    <subfield code="p">user-webis</subfield>
    <subfield code="o">oai:zenodo.org:3653834</subfield>
  </datafield>
  <!-- First-listed author, in the same "Surname, Forename" form as the 700 entries. -->
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">Paderborn University</subfield>
    <subfield code="0">(orcid)0000-0003-3400-6075</subfield>
    <subfield code="a">Chen, Wei-Fan</subfield>
  </datafield>
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">Webis Abstractive Snippet Corpus 2020</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-webis</subfield>
  </datafield>
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">https://creativecommons.org/licenses/by/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution 4.0 International</subfield>
  </datafield>
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <!-- Description. The value is an HTML fragment stored as escaped text, so the angle
       brackets that are literal characters in the HTML are escaped twice on purpose;
       do not collapse that escaping. -->
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;The Webis Abstractive Snippet Corpus 2020 (Webis-Snippet-20) comprises four abstractive snippet datasets from ClueWeb09, ClueWeb12, and DMOZ descriptions. More than 10 million &amp;lt;webpage, abstractive snippet&amp;gt; pairs / 3.5 million &amp;lt;query, webpage, abstractive snippet&amp;gt; pairs were collected.&lt;/p&gt;</subfield>
  </datafield>
  <!-- 773: DOI that this record is a version of. 024: DOI of this record itself. -->
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="a">10.5281/zenodo.3653833</subfield>
  </datafield>
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.3653834</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">dataset</subfield>
  </datafield>
</record>
820
2,699
views
downloads
All versions This version
Views 820 820
Downloads 2,699 2,699
Data volume 10.8 TB 10.8 TB
Unique views 735 735
Unique downloads 365 365

Share

Cite as