Dataset Open Access

A Dataset of Pull Requests and A Trained Random Forest Model for predicting Pull Request Acceptance

Tapajit Dey; Audris Mockus


JSON Export

{
  "files": [
    {
      "links": {
        "self": "https://zenodo.org/api/files/4e849a51-1a85-4d9e-b87d-55c087e3a82d/Curated_Pull_Request_Data.csv"
      }, 
      "checksum": "md5:9ba00c622679e3ae6d2ff12bde44e3e7", 
      "bucket": "4e849a51-1a85-4d9e-b87d-55c087e3a82d", 
      "key": "Curated_Pull_Request_Data.csv", 
      "type": "csv", 
      "size": 35811600
    }, 
    {
      "links": {
        "self": "https://zenodo.org/api/files/4e849a51-1a85-4d9e-b87d-55c087e3a82d/description.pdf"
      }, 
      "checksum": "md5:4c5c559bb644f3e2c991d71dc19932b5", 
      "bucket": "4e849a51-1a85-4d9e-b87d-55c087e3a82d", 
      "key": "description.pdf", 
      "type": "pdf", 
      "size": 40352
    }, 
    {
      "links": {
        "self": "https://zenodo.org/api/files/4e849a51-1a85-4d9e-b87d-55c087e3a82d/PRMODEL.Rdata"
      }, 
      "checksum": "md5:ba1eb93c488e1090ab051901aeb370f2", 
      "bucket": "4e849a51-1a85-4d9e-b87d-55c087e3a82d", 
      "key": "PRMODEL.Rdata", 
      "type": "rdata", 
      "size": 258433749
    }, 
    {
      "links": {
        "self": "https://zenodo.org/api/files/4e849a51-1a85-4d9e-b87d-55c087e3a82d/snippet.R"
      }, 
      "checksum": "md5:5cf376f3114ce94edf9e16fddaa50185", 
      "bucket": "4e849a51-1a85-4d9e-b87d-55c087e3a82d", 
      "key": "snippet.R", 
      "type": "r", 
      "size": 841
    }
  ], 
  "owners": [
    90284
  ], 
  "doi": "10.5281/zenodo.3858046", 
  "stats": {
    "version_unique_downloads": 32.0, 
    "unique_views": 43.0, 
    "views": 54.0, 
    "version_views": 57.0, 
    "unique_downloads": 32.0, 
    "version_unique_views": 43.0, 
    "volume": 2251698451.0, 
    "version_downloads": 55.0, 
    "downloads": 54.0, 
    "version_volume": 2251738803.0
  }, 
  "links": {
    "doi": "https://doi.org/10.5281/zenodo.3858046", 
    "conceptdoi": "https://doi.org/10.5281/zenodo.3858032", 
    "bucket": "https://zenodo.org/api/files/4e849a51-1a85-4d9e-b87d-55c087e3a82d", 
    "conceptbadge": "https://zenodo.org/badge/doi/10.5281/zenodo.3858032.svg", 
    "html": "https://zenodo.org/record/3858046", 
    "latest_html": "https://zenodo.org/record/3858046", 
    "badge": "https://zenodo.org/badge/doi/10.5281/zenodo.3858046.svg", 
    "latest": "https://zenodo.org/api/records/3858046"
  }, 
  "conceptdoi": "10.5281/zenodo.3858032", 
  "created": "2020-05-26T19:53:07.512049+00:00", 
  "updated": "2020-07-20T16:50:43.456576+00:00", 
  "conceptrecid": "3858032", 
  "revision": 4, 
  "id": 3858046, 
  "metadata": {
    "access_right_category": "success", 
    "doi": "10.5281/zenodo.3858046", 
    "description": "<p>A Curated Dataset of 470,925 pull requests for 3349 popular NPM packages, description of the variables, code snippet for creating a Random Forest model for predicting pull request acceptance, and a pre-trained&nbsp;&nbsp;Random Forest model (in R). The dataset is for the ESEM-2020 paper: &quot;Impact of Technical and Social Factors on Pull Request Quality for the NPM Ecosystem&quot; (<a href=\"https://arxiv.org/abs/2007.04816\">https://arxiv.org/abs/2007.04816</a>)</p>", 
    "license": {
      "id": "CC-BY-4.0"
    }, 
    "title": "A Dataset of Pull Requests and A Trained Random Forest Model for predicting Pull Request Acceptance", 
    "relations": {
      "version": [
        {
          "count": 2, 
          "index": 1, 
          "parent": {
            "pid_type": "recid", 
            "pid_value": "3858032"
          }, 
          "is_last": true, 
          "last_child": {
            "pid_type": "recid", 
            "pid_value": "3858046"
          }
        }
      ]
    }, 
    "communities": [
      {
        "id": "woc"
      }
    ], 
    "keywords": [
      "Pull Request", 
      "Random Forest"
    ], 
    "publication_date": "2020-05-26", 
    "creators": [
      {
        "orcid": "0000-0002-1379-8539", 
        "affiliation": "University of Tennessee", 
        "name": "Tapajit Dey"
      }, 
      {
        "affiliation": "University of Tennessee", 
        "name": "Audris Mockus"
      }
    ], 
    "access_right": "open", 
    "resource_type": {
      "type": "dataset", 
      "title": "Dataset"
    }, 
    "related_identifiers": [
      {
        "scheme": "doi", 
        "identifier": "10.5281/zenodo.3858032", 
        "relation": "isVersionOf"
      }
    ]
  }
}
57 views
55 downloads
Statistic | All versions | This version
Views | 57 | 54
Downloads | 55 | 54
Data volume | 2.3 GB | 2.3 GB
Unique views | 43 | 43
Unique downloads | 32 | 32

Share

Cite as