Dataset Open Access

DIRE: A Neural Approach to Decompiled Identifier Naming

Lacomis, Jeremy; Yin, Pengcheng; Schwartz, Edward J.; Allamanis, Miltiadis; Le Goues, Claire; Neubig, Graham; Vasilescu, Bogdan


DataCite XML Export

<?xml version='1.0' encoding='utf-8'?>
<!--
  DataCite metadata record (default namespace http://datacite.org/schema/kernel-4,
  schemaLocation hint pointing at the kernel-4.1 XSD) describing the dataset
  "DIRE: A Neural Approach to Decompiled Identifier Naming".
-->
<resource xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://datacite.org/schema/kernel-4" xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.1/metadata.xsd">
  <!-- DOI of this record; see relatedIdentifiers below for the DOI it is a version of. -->
  <identifier identifierType="DOI">10.5281/zenodo.3403078</identifier>
  <!--
    Seven creators. Each entry gives the name three ways: combined "Family, Given"
    in creatorName, plus separate givenName and familyName, followed by one affiliation.
    Only the first creator carries a nameIdentifier (ORCID).
  -->
  <creators>
    <creator>
      <creatorName>Lacomis, Jeremy</creatorName>
      <givenName>Jeremy</givenName>
      <familyName>Lacomis</familyName>
      <!-- NOTE(review): schemeURI uses the http:// form of the ORCID base URI; confirm whether the consuming schema version expects https. -->
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0003-0653-5738</nameIdentifier>
      <affiliation>Carnegie Mellon University</affiliation>
    </creator>
    <creator>
      <creatorName>Yin, Pengcheng</creatorName>
      <givenName>Pengcheng</givenName>
      <familyName>Yin</familyName>
      <affiliation>Carnegie Mellon University</affiliation>
    </creator>
    <creator>
      <creatorName>Schwartz, Edward J.</creatorName>
      <givenName>Edward J.</givenName>
      <familyName>Schwartz</familyName>
      <affiliation>Carnegie Mellon University Software Engineering Institute</affiliation>
    </creator>
    <creator>
      <creatorName>Allamanis, Miltiadis</creatorName>
      <givenName>Miltiadis</givenName>
      <familyName>Allamanis</familyName>
      <affiliation>Microsoft Research</affiliation>
    </creator>
    <creator>
      <creatorName>Le Goues, Claire</creatorName>
      <givenName>Claire</givenName>
      <familyName>Le Goues</familyName>
      <affiliation>Carnegie Mellon University</affiliation>
    </creator>
    <creator>
      <creatorName>Neubig, Graham</creatorName>
      <givenName>Graham</givenName>
      <familyName>Neubig</familyName>
      <affiliation>Carnegie Mellon University</affiliation>
    </creator>
    <creator>
      <creatorName>Vasilescu, Bogdan</creatorName>
      <givenName>Bogdan</givenName>
      <familyName>Vasilescu</familyName>
      <affiliation>Carnegie Mellon University</affiliation>
    </creator>
  </creators>
  <titles>
    <title>DIRE: A Neural Approach to Decompiled Identifier Naming</title>
  </titles>
  <publisher>Zenodo</publisher>
  <!-- publicationYear matches the year of the "Issued" date below. -->
  <publicationYear>2019</publicationYear>
  <dates>
    <date dateType="Issued">2019-09-09</date>
  </dates>
  <!-- Only the general resource type is given; the element has no free-text content. -->
  <resourceType resourceTypeGeneral="Dataset"/>
  <!-- Landing-page URL for the same record number that appears in the DOI above. -->
  <alternateIdentifiers>
    <alternateIdentifier alternateIdentifierType="url">https://zenodo.org/record/3403078</alternateIdentifier>
  </alternateIdentifiers>
  <!-- Declares this record to be a version of the record with DOI 10.5281/zenodo.3403077. -->
  <relatedIdentifiers>
    <relatedIdentifier relatedIdentifierType="DOI" relationType="IsVersionOf">10.5281/zenodo.3403077</relatedIdentifier>
  </relatedIdentifiers>
  <!-- Two rights statements: the license (MIT) and the access level (open access). -->
  <rightsList>
    <rights rightsURI="https://opensource.org/licenses/MIT">MIT License</rights>
    <rights rightsURI="info:eu-repo/semantics/openAccess">Open Access</rights>
  </rightsList>
  <!--
    The abstract is HTML carried as escaped text: after XML parsing, the value still
    contains literal <p> tags and HTML entity references (&quot;, &nbsp;, &#39;), so a
    consumer must HTML-decode it separately. The blank lines between paragraphs are
    part of the element's text content; do not re-indent or pretty-print this element.
  -->
  <descriptions>
    <description descriptionType="Abstract">&lt;p&gt;This dataset is released as a companion to the paper &amp;quot;DIRE: A Neural Approach to Decompiled Identifier Naming&amp;quot;, appearing in the proceedings of the&amp;nbsp;34th IEEE/ACM International Conference on Automated Software Engineering (ASE 2019).&lt;/p&gt;

&lt;p&gt;It contains information generated by decompiling 3,195,962 functions found in 164,632 unique binaries generated from C code scraped from GitHub. For practicality, the dataset is partitioned into 16 archives by the first hexadecimal digit of the SHA-256 hash of the binary used to generate it. Each of the 16 archives contains approximately 10,000&amp;nbsp;JSONL files, named according to a binary&amp;#39;s hash. Each JSONL file consists of a single JSON object per-line corresponding to a single function in the decompiled binary.&lt;/p&gt;

&lt;p&gt;Archives are provided in both GZIP and BZIP2 format.&lt;/p&gt;

&lt;p&gt;See the README file for more information.&lt;/p&gt;</description>
  </descriptions>
</resource>
546 views
5,059 downloads
| All versions | This version
Views | 546 | 546
Downloads | 5,059 | 5,059
Data volume | 846.1 GB | 846.1 GB
Unique views | 482 | 482
Unique downloads | 347 | 347

Share

Cite as