{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2021-09-02T15:21:49.172864+00:00",
  "custom_fields": {},
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 4,
    "enabled": true,
    "entries": {
      "benchmark.json": {
        "checksum": "md5:e1080d051298444befa1014d4fa7bda0",
        "ext": "json",
        "id": "f2af322b-5a77-4a84-8d1c-13d947713e22",
        "key": "benchmark.json",
        "metadata": null,
        "mimetype": "application/json",
        "size": 4169673
      },
      "eval-index.jsonl": {
        "checksum": "md5:39f504c8d64f261b7862e3917aa259f7",
        "ext": "bin",
        "id": "15c78217-d7cd-4706-b423-49805f18a70b",
        "key": "eval-index.jsonl",
        "metadata": null,
        "mimetype": "application/octet-stream",
        "size": 632582
      },
      "predictions-annotated.json": {
        "checksum": "md5:a50ad18a28bf8d1d750afba51118f00e",
        "ext": "json",
        "id": "6a18d1b0-60a4-40c5-be13-b91cee6b41b5",
        "key": "predictions-annotated.json",
        "metadata": null,
        "mimetype": "application/json",
        "size": 6392629
      },
      "train-index.jsonl": {
        "checksum": "md5:cfd046716905235ee8f7139ee4ee240f",
        "ext": "bin",
        "id": "76f719f0-a616-40ac-92f8-c3d1d63fe8ce",
        "key": "train-index.jsonl",
        "metadata": null,
        "mimetype": "application/octet-stream",
        "size": 5692261
      }
    },
    "order": [],
    "total_bytes": 16887145
  },
  "id": "5384768",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/5384768/access",
    "access_grants": "https://zenodo.org/api/records/5384768/access/grants",
    "access_links": "https://zenodo.org/api/records/5384768/access/links",
    "access_request": "https://zenodo.org/api/records/5384768/access/request",
    "access_users": "https://zenodo.org/api/records/5384768/access/users",
    "archive": "https://zenodo.org/api/records/5384768/files-archive",
    "archive_media": "https://zenodo.org/api/records/5384768/media-files-archive",
    "communities": "https://zenodo.org/api/records/5384768/communities",
    "communities-suggestions": "https://zenodo.org/api/records/5384768/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.5384768",
    "draft": "https://zenodo.org/api/records/5384768/draft",
    "files": "https://zenodo.org/api/records/5384768/files",
    "latest": "https://zenodo.org/api/records/5384768/versions/latest",
    "latest_html": "https://zenodo.org/records/5384768/latest",
    "media_files": "https://zenodo.org/api/records/5384768/media-files",
    "parent": "https://zenodo.org/api/records/5384767",
    "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.5384767",
    "parent_html": "https://zenodo.org/records/5384767",
    "requests": "https://zenodo.org/api/records/5384768/requests",
    "reserve_doi": "https://zenodo.org/api/records/5384768/draft/pids/doi",
    "self": "https://zenodo.org/api/records/5384768",
    "self_doi": "https://zenodo.org/doi/10.5281/zenodo.5384768",
    "self_html": "https://zenodo.org/records/5384768",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:5384768/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:5384768/sequence/default",
    "versions": "https://zenodo.org/api/records/5384768/versions"
  },
  "media_files": {
    "count": 0,
    "enabled": false,
    "entries": {},
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "creators": [
      {
        "affiliations": [
          {
            "name": "Nokia Bell Labs"
          }
        ],
        "person_or_org": {
          "family_name": "Heyman",
          "given_name": "Geert",
          "identifiers": [
            {
              "identifier": "0000-0001-6276-424X",
              "scheme": "orcid"
            }
          ],
          "name": "Heyman, Geert",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "Nokia Bell Labs"
          }
        ],
        "person_or_org": {
          "family_name": "Huysegems",
          "given_name": "Rafeal",
          "identifiers": [
            {
              "identifier": "0000-0001-6244-9864",
              "scheme": "orcid"
            }
          ],
          "name": "Huysegems, Rafeal",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "Nokia Bell Labs"
          }
        ],
        "person_or_org": {
          "family_name": "Justen",
          "given_name": "Pascal",
          "name": "Justen, Pascal",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "Nokia Bell Labs"
          }
        ],
        "person_or_org": {
          "family_name": "Van Cutsem",
          "given_name": "Tom",
          "identifiers": [
            {
              "identifier": "0000-0003-4116-4290",
              "scheme": "orcid"
            }
          ],
          "name": "Van Cutsem, Tom",
          "type": "personal"
        }
      }
    ],
    "description": "<p>In this dataset you find the&nbsp;user study data that was used in the <strong><em>Natural Language-Guided Programming</em></strong> paper, which is accepted for Onward! 2021. A preprint can be found here&nbsp;<a href=\"https://arxiv.org/pdf/2108.05198.pdf\">https://arxiv.org/pdf/2108.05198.pdf</a>. The dataset consists of the following files:</p>\n\n<ul>\n\t<li>\n\t<p>benchmark.json contains 201 test cases. Each test case consists of context, a natural language intent and target code. The test cases are intended to evaluate a model that can predict code giving a piece of context code and a natural language intent. The test cases were derived from Jupyter notebooks that were crawled from Github projects with permissive licenses. In the project_metadata field you find information about the original project such as its git url&nbsp;and&nbsp;license.</p>\n\t</li>\n\t<li>\n\t<p>predictions-annotated.json contains predictions of the three models used in the paper for 100 test cases in benchmark.json. Each prediction is accompanied with qualitive assesments from three annotators.</p>\n\t</li>\n\t<li>\n\t<p>train-index.jsonl is the list of github projects that were used for training the models.</p>\n\t</li>\n\t<li>\n\t<p>eval-index.jsonl is a list of github projects that we kept separate for evaluation. The benchmark.json was created from a random subset of the projects in this list.</p>\n\t</li>\n</ul>\n\n<p>For more details we refer to the paper.</p>",
    "publication_date": "2021-09-02",
    "publisher": "Zenodo",
    "resource_type": {
      "id": "dataset",
      "title": {
        "de": "Datensatz",
        "en": "Dataset"
      }
    },
    "rights": [
      {
        "description": {
          "en": ""
        },
        "id": "bsd-3-clause",
        "props": {
          "scheme": "spdx",
          "url": "https://opensource.org/licenses/BSD-3-Clause"
        },
        "title": {
          "en": "BSD 3-Clause \"New\" or \"Revised\" License"
        }
      }
    ],
    "subjects": [
      {
        "subject": "code completion"
      },
      {
        "subject": "code prediction"
      },
      {
        "subject": "natural language-guided programming"
      },
      {
        "subject": "example-centric programming"
      }
    ],
    "title": "Natural Language-Guided Programming User Study",
    "version": "0.0.1"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "124380"
      }
    },
    "communities": {},
    "id": "5384767",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.5384767",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.5384768",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:5384768",
      "provider": "oai"
    }
  },
  "revision_id": 3,
  "stats": {
    "all_versions": {
      "data_volume": 248929049.0,
      "downloads": 59,
      "unique_downloads": 30,
      "unique_views": 303,
      "views": 340
    },
    "this_version": {
      "data_volume": 248929049.0,
      "downloads": 59,
      "unique_downloads": 30,
      "unique_views": 302,
      "views": 339
    }
  },
  "status": "published",
  "updated": "2021-09-03T01:48:40.556163+00:00",
  "versions": {
    "index": 1,
    "is_latest": true
  }
}