{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2026-06-22T15:02:03.290349+00:00",
  "custom_fields": {},
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 2,
    "enabled": true,
    "entries": {
      "FAS_SMIDGE_DailyMail_2021_sample_20 words_150k.xlsx": {
        "access": {
          "hidden": false
        },
        "checksum": "md5:edcdd07cfd8f82e05fb1118462c26a7f",
        "ext": "xlsx",
        "id": "d88ac131-c863-42e7-8ede-a605c08f996f",
        "key": "FAS_SMIDGE_DailyMail_2021_sample_20 words_150k.xlsx",
        "links": {
          "content": "https://zenodo.org/api/records/20799370/files/FAS_SMIDGE_DailyMail_2021_sample_20%20words_150k.xlsx/content",
          "self": "https://zenodo.org/api/records/20799370/files/FAS_SMIDGE_DailyMail_2021_sample_20%20words_150k.xlsx"
        },
        "metadata": {},
        "mimetype": "application/octet-stream",
        "size": 40005517,
        "storage_class": "L"
      },
      "SMIDGE_Metadata template_DailyMail.docx": {
        "access": {
          "hidden": false
        },
        "checksum": "md5:614aac818cce5a16ac8f0d1278708f7d",
        "ext": "docx",
        "id": "21390f42-19f8-4319-9642-894b6b01e292",
        "key": "SMIDGE_Metadata template_DailyMail.docx",
        "links": {
          "content": "https://zenodo.org/api/records/20799370/files/SMIDGE_Metadata%20template_DailyMail.docx/content",
          "self": "https://zenodo.org/api/records/20799370/files/SMIDGE_Metadata%20template_DailyMail.docx"
        },
        "metadata": {},
        "mimetype": "application/octet-stream",
        "size": 105517,
        "storage_class": "L"
      }
    },
    "order": [],
    "total_bytes": 40111034
  },
  "id": "20799370",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/20799370/access",
    "access_grants": "https://zenodo.org/api/records/20799370/access/grants",
    "access_links": "https://zenodo.org/api/records/20799370/access/links",
    "access_request": "https://zenodo.org/api/records/20799370/access/request",
    "access_users": "https://zenodo.org/api/records/20799370/access/users",
    "archive": "https://zenodo.org/api/records/20799370/files-archive",
    "archive_media": "https://zenodo.org/api/records/20799370/media-files-archive",
    "communities": "https://zenodo.org/api/records/20799370/communities",
    "communities-suggestions": "https://zenodo.org/api/records/20799370/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.20799370",
    "draft": "https://zenodo.org/api/records/20799370/draft",
    "file_modification": "https://zenodo.org/api/records/20799370/file-modification",
    "files": "https://zenodo.org/api/records/20799370/files",
    "latest": "https://zenodo.org/api/records/20799370/versions/latest",
    "latest_html": "https://zenodo.org/records/20799370/latest",
    "media_files": "https://zenodo.org/api/records/20799370/media-files",
    "parent": "https://zenodo.org/api/records/20796242",
    "parent_doi": "https://doi.org/10.5281/zenodo.20796242",
    "parent_doi_html": "https://zenodo.org/doi/10.5281/zenodo.20796242",
    "parent_html": "https://zenodo.org/records/20796242",
    "preview_html": "https://zenodo.org/records/20799370?preview=1",
    "quota_increase": "https://zenodo.org/api/records/20799370/quota-increase",
    "request_deletion": "https://zenodo.org/api/records/20799370/request-deletion",
    "requests": "https://zenodo.org/api/records/20799370/requests",
    "reserve_doi": "https://zenodo.org/api/records/20799370/draft/pids/doi",
    "self": "https://zenodo.org/api/records/20799370",
    "self_doi": "https://doi.org/10.5281/zenodo.20799370",
    "self_doi_html": "https://zenodo.org/doi/10.5281/zenodo.20799370",
    "self_html": "https://zenodo.org/records/20799370",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:20799370/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:20799370/sequence/default",
    "versions": "https://zenodo.org/api/records/20799370/versions"
  },
  "media_files": {
    "count": 0,
    "enabled": false,
    "entries": {},
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "creators": [
      {
        "affiliations": [
          {
            "name": "FASresearch GmbH"
          }
        ],
        "person_or_org": {
          "family_name": "Gulas",
          "given_name": "Christian",
          "identifiers": [
            {
              "identifier": "0000-0002-9065-7641",
              "scheme": "orcid"
            }
          ],
          "name": "Gulas, Christian",
          "type": "personal"
        },
        "role": {
          "id": "contactperson",
          "title": {
            "de": "Kontaktperson",
            "en": "Contact person"
          }
        }
      }
    ],
    "description": "<p class=\"MsoNormal\"><span>The dataset of user comments was sourced from the online platform of the Daily Mail. A custom Python-based web scraping tool was developed to systematically extract data from articles published during the calendar year 2021. This initial process retrieved a comprehensive corpus of 224,981 articles and successfully downloaded over 41 million associated user comments. For each comment, relevant metadata was collected, including the comment text, user ID, timestamp, and community feedback metrics such as positive and negative votes.</span></p>\n<p class=\"MsoNormal\"><span>The dataset provided for analysis is a&nbsp;random sample of 150,000 user comments&nbsp;drawn from this extensive 2021 collection. To ensure the suitability of the data for in-depth textual analysis, a filtering criterion was applied to the sampling process. The resulting sample exclusively contains comments with a minimum length of&nbsp;at least 20 words. This step was implemented to isolate more substantive comments, making the dataset particularly well-suited for further analytical tasks such as topic modeling, sentiment analysis, and detailed qualitative examination.</span></p>\n<p class=\"MsoNormal\"><span>Column description:</span></p>\n<p class=\"FAS1CxSpFirst\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>RowID: Sequential row identifier within the exported dataset.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>AssetId: Identifier of the Daily Mail article to which the comment belongs.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>category: Content category/section of the article (e.g. news, sport, femail, tvshowbiz).</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>custom_id: Unique identifier of the comment.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>AssetHeadline: Headline/title of the article.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>DateCreated: Date and time when the comment was created; stored in the file as a numeric date value.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>AssetCommentCount: Total number of comments associated with the article.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>AssetUrl: URL path of the corresponding Daily Mail article.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>message: Full text of the user comment.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>year: Year of publication/collection of the comment (2021).</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>VoteCount: Total number of votes received by the comment.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>VoteRating: Net rating of the comment, calculated as positive votes minus negative votes.</span></p>\n<p class=\"FAS1CxSpMiddle\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>pos_votes: Number of positive votes received by the comment.</span></p>\n<p class=\"FAS1CxSpLast\"><span><span>&middot;<span>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; </span></span></span><span>neg_votes: Number of negative votes received by the comment.</span></p>",
    "funding": [
      {
        "award": {
          "acronym": "SMIDGE",
          "id": "00k4n6c32::101095290",
          "identifiers": [
            {
              "identifier": "https://cordis.europa.eu/projects/101095290",
              "scheme": "url"
            }
          ],
          "number": "101095290",
          "program": "HORIZON.2.2",
          "title": {
            "en": "Social Media narratives: addressing extremism in middle age"
          }
        },
        "funder": {
          "id": "00k4n6c32",
          "name": "European Commission"
        }
      }
    ],
    "publication_date": "2026-06-22",
    "publisher": "Zenodo",
    "related_identifiers": [
      {
        "identifier": "10.5281/zenodo.18847300",
        "relation_type": {
          "id": "ispublishedin",
          "title": {
            "de": "Ist ver\u00f6ffentlicht in",
            "en": "Is published in"
          }
        },
        "resource_type": {
          "id": "publication-deliverable",
          "title": {
            "de": "Projektergebnis",
            "en": "Project deliverable"
          }
        },
        "scheme": "doi"
      }
    ],
    "resource_type": {
      "id": "dataset",
      "title": {
        "de": "Datensatz",
        "en": "Dataset"
      }
    },
    "rights": [
      {
        "description": {
          "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited."
        },
        "icon": "cc-by-icon",
        "id": "cc-by-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution 4.0 International"
        }
      }
    ],
    "title": "SMIDGE Daily Mail comments dataset"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "1121522"
      },
      "settings": {
        "accept_conditions_text": null,
        "allow_guest_requests": false,
        "allow_user_requests": false,
        "secret_link_expiration": 0
      }
    },
    "communities": {
      "default": "5e04626c-e7a3-4718-bde5-7b20d2c925bd",
      "entries": [
        {
          "access": {
            "member_policy": "open",
            "members_visibility": "public",
            "record_submission_policy": "closed",
            "review_policy": "members",
            "visibility": "public"
          },
          "children": {
            "allow": false
          },
          "created": "2024-06-07T07:00:39.613907+00:00",
          "custom_fields": {
            "subjects": [
              {
                "id": "euroscivoc:299"
              },
              {
                "id": "euroscivoc:93"
              },
              {
                "id": "euroscivoc:30020"
              },
              {
                "id": "euroscivoc:103"
              },
              {
                "id": "euroscivoc:105"
              },
              {
                "id": "euroscivoc:89"
              },
              {
                "id": "euroscivoc:47"
              },
              {
                "id": "euroscivoc:575"
              }
            ]
          },
          "deletion_status": {
            "is_deleted": false,
            "status": "P"
          },
          "id": "5e04626c-e7a3-4718-bde5-7b20d2c925bd",
          "links": {},
          "metadata": {
            "curation_policy": "",
            "description": "The SMIDGE project will analyse conspiracy theories, misinformation, extremist narratives in Europe. Grant agreement ID: 101095290",
            "organizations": [
              {
                "id": "035b05819"
              },
              {
                "id": "0312pnr83"
              },
              {
                "id": "037wrv551"
              },
              {
                "name": "University of Central Lancashire, Cyprus"
              },
              {
                "name": "Inclusive Europe"
              },
              {
                "id": "00wjc7c48"
              },
              {
                "name": "FAS Research"
              },
              {
                "name": "Fondazione Villa Montesca"
              }
            ],
            "title": "SMIDGE: Social Media narratives: addressing extremism in middle age",
            "type": {
              "id": "project"
            },
            "website": "https://www.smidgeproject.eu/"
          },
          "revision_id": 7,
          "slug": "smidge",
          "updated": "2026-06-22T12:09:52.682198+00:00"
        }
      ],
      "ids": [
        "5e04626c-e7a3-4718-bde5-7b20d2c925bd"
      ]
    },
    "id": "20796242",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.20796242",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.20799370",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:20799370",
      "provider": "oai"
    }
  },
  "revision_id": 4,
  "stats": {
    "all_versions": {
      "data_volume": 481753068.0,
      "downloads": 28,
      "unique_downloads": 25,
      "unique_views": 66,
      "views": 72
    },
    "this_version": {
      "data_volume": 320888272.0,
      "downloads": 16,
      "unique_downloads": 15,
      "unique_views": 29,
      "views": 32
    }
  },
  "status": "published",
  "swh": {},
  "updated": "2026-06-22T15:02:03.450221+00:00",
  "versions": {
    "index": 3,
    "is_latest": true
  }
}