Dataset Open Access

Hacker News Curated Comments Dataset

Christopher Moody

MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<!--
  MARC21 XML export of the record "Hacker News Curated Comments Dataset"
  (control number 45901, DOI 10.5281/zenodo.45901).

  Every datafield and the record root are explicitly closed so the document
  is well-formed. Field order and all values are kept exactly as exported.

  NOTE(review): the empty default namespace (xmlns="") and the empty
  subfields 540$u, 909$o, 856$u and 650$2 look like values that were dropped
  during extraction. MARCXML records normally declare the namespace
  http://www.loc.gov/MARC21/slim. Confirm against the authoritative record
  before restoring any of them.
-->
<record xmlns="">
  <!-- 540: terms governing use (licence); $u is empty in this export -->
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u"></subfield>
    <subfield code="a">Creative Commons Zero v1.0 Universal</subfield>
  </datafield>
  <!-- 260: publication date -->
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2016-02-10</subfield>
  </datafield>
  <!-- 005: timestamp of latest transaction; 001: control number -->
  <controlfield tag="005">20200124192545.0</controlfield>
  <controlfield tag="001">45901</controlfield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire_data</subfield>
    <subfield code="o"></subfield>
  </datafield>
  <!-- 520: description; the text is escaped HTML, so its whitespace is data and must not be re-indented -->
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;A curated dataset from&amp;nbsp;fh-bigquery:hackernews.stories&lt;/p&gt;

&lt;p&gt;Only HN stories with more than 10 comments are included, and only comments from users with more than 10 comments are included.&lt;/p&gt;</subfield>
  </datafield>
  <!-- 856: file entry ($s size, $z md5 checksum); $u is empty in this export -->
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">780573044</subfield>
    <subfield code="z">md5:1900b83d663a9cf2f34fd9d42fdb3846</subfield>
    <subfield code="u"></subfield>
  </datafield>
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">dataset</subfield>
  </datafield>
  <!-- 100: main author ($a name, $u affiliation) -->
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">Stitch Fix</subfield>
    <subfield code="a">Christopher Moody</subfield>
  </datafield>
  <!-- 653: keywords -->
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">hacker news, topic models, text, nlp</subfield>
  </datafield>
  <!-- 024: identifier; $2 names the scheme (doi) -->
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.45901</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <!-- 245: title -->
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">Hacker News Curated Comments Dataset</subfield>
  </datafield>
  <!-- NOTE(review): 650$a says "cc-by" while 540$a says CC0; $2 is empty. Confirm against the source record. -->
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2"></subfield>
  </datafield>
</record>
All versions | This version
Views: 44,524 | 44,513
Downloads: 83,835 | 83,803
Data volume: 65.4 TB | 65.4 TB
Unique views: 41,481 | 41,470
Unique downloads: 62,058 | 62,032


Cite as