<?xml version='1.0' encoding='utf-8'?>
<oai_dc:dc xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
  <dc:creator>Anonymous Authors</dc:creator>
  <dc:date>2022-01-05</dc:date>
  <dc:description>This repository holds the Clarity Dataset, which is a companion to the SANER'22 paper entitled "An Empirical Investigation into the Use of Image Captioning for Automated Software Documentation". The dataset consists of 45,998 captions for 10,204 GUI screenshots and XML metadata files (akin to the "HTML" for stipulating GUIs) of Android applications. The NL captions were obtained from human labelers, underwent several quality control mechanisms, and contain both high-level (screen) and low-level (component) descriptions of screen functionality. This dataset is meant as a new source of data to augment techniques for software documentation that can take advantage of the rich pixel-based information contained within screenshots.</dc:description>
  <dc:identifier>https://doi.org/10.5281/zenodo.5822884</dc:identifier>
  <dc:identifier>oai:zenodo.org:5822884</dc:identifier>
  <dc:publisher>Zenodo</dc:publisher>
  <dc:relation>https://doi.org/10.5281/zenodo.5821839</dc:relation>
  <dc:rights>info:eu-repo/semantics/openAccess</dc:rights>
  <dc:rights>Creative Commons Attribution 4.0 International</dc:rights>
  <dc:rights>https://creativecommons.org/licenses/by/4.0/legalcode</dc:rights>
  <dc:subject>Software Documentation</dc:subject>
  <dc:subject>Android</dc:subject>
  <dc:subject>Screenshots</dc:subject>
  <dc:subject>Captions</dc:subject>
  <dc:title>The Clarity Software Documentation Dataset</dc:title>
  <dc:type>info:eu-repo/semantics/other</dc:type>
</oai_dc:dc>