{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2017-04-12T13:17:57.791485+00:00",
  "custom_fields": {
    "meeting:meeting": {
      "acronym": "CVPR",
      "dates": "21-26 July 2017",
      "title": "Computer Vision and Pattern Recognition"
    }
  },
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "CAD_release.tar.gz": {
        "checksum": "md5:be832f74fa4a3db7644f9e47175d4bc3",
        "ext": "gz",
        "id": "e2ddf17e-2740-438c-a23b-e07c3f309f3a",
        "key": "CAD_release.tar.gz",
        "metadata": null,
        "mimetype": "application/gzip",
        "size": 2570322318
      }
    },
    "order": [],
    "total_bytes": 2570322318
  },
  "id": "495570",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/495570/access",
    "access_grants": "https://zenodo.org/api/records/495570/access/grants",
    "access_links": "https://zenodo.org/api/records/495570/access/links",
    "access_request": "https://zenodo.org/api/records/495570/access/request",
    "access_users": "https://zenodo.org/api/records/495570/access/users",
    "archive": "https://zenodo.org/api/records/495570/files-archive",
    "archive_media": "https://zenodo.org/api/records/495570/media-files-archive",
    "communities": "https://zenodo.org/api/records/495570/communities",
    "communities-suggestions": "https://zenodo.org/api/records/495570/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.495570",
    "draft": "https://zenodo.org/api/records/495570/draft",
    "files": "https://zenodo.org/api/records/495570/files",
    "latest": "https://zenodo.org/api/records/495570/versions/latest",
    "latest_html": "https://zenodo.org/records/495570/latest",
    "media_files": "https://zenodo.org/api/records/495570/media-files",
    "parent": "https://zenodo.org/api/records/795703",
    "parent_doi": "https://zenodo.org/doi/",
    "parent_html": "https://zenodo.org/records/795703",
    "requests": "https://zenodo.org/api/records/495570/requests",
    "reserve_doi": "https://zenodo.org/api/records/495570/draft/pids/doi",
    "self": "https://zenodo.org/api/records/495570",
    "self_doi": "https://zenodo.org/doi/10.5281/zenodo.495570",
    "self_html": "https://zenodo.org/records/495570",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:495570/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:495570/sequence/default",
    "versions": "https://zenodo.org/api/records/495570/versions"
  },
  "media_files": {
    "count": 0,
    "enabled": false,
    "entries": {},
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "additional_descriptions": [
      {
        "description": "Acknowledgments. The work has been financially supported by the DFG projects GA 1927/5-1 (DFG Research Unit FOR 2535 Anticipating Human Behavior) and GA 1927/2-2 (DFG Research Unit FOR 1505 Mapping on Demand).",
        "type": {
          "id": "notes",
          "title": {
            "de": "Anmerkungen",
            "en": "Notes"
          }
        }
      }
    ],
    "creators": [
      {
        "affiliations": [
          {
            "name": "University of Bonn"
          }
        ],
        "person_or_org": {
          "family_name": "Sawatzky",
          "given_name": "Johann",
          "name": "Sawatzky, Johann",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "Carl Zeiss AG"
          }
        ],
        "person_or_org": {
          "family_name": "Srikantha",
          "given_name": "Abhilash",
          "name": "Srikantha, Abhilash",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "University of Bonn"
          }
        ],
        "person_or_org": {
          "family_name": "Gall",
          "given_name": "Juergen",
          "name": "Gall, Juergen",
          "type": "personal"
        }
      }
    ],
    "description": "<p>% ==============================================================================<br>\n% CAD 120 Affordance Dataset<br>\n% Version 1.0<br>\n% ------------------------------------------------------------------------------<br>\n% If you use the dataset please cite:<br>\n%<br>\n% Johann Sawatzky, Abhilash Srikantha, Juergen Gall.<br>\n% Weakly Supervised Affordance Detection.<br>\n% IEEE Conference on Computer Vision and Pattern Recognition (CVPR'17)<br>\n%<br>\n% and<br>\n%<br>\n% H. S. Koppula and A. Saxena.<br>\n% Physically grounded spatio-temporal object affordances.<br>\n% European Conference on Computer Vision (ECCV'14)<br>\n%<br>\n% Any bugs or questions, please email sawatzky AT iai DOT uni-bonn DOT de.<br>\n% ==============================================================================</p>\n\n<p>This is the CAD 120 Affordance Segmentation Dataset based on the Cornell Activity<br>\nDataset CAD 120 (see http://pr.cs.cornell.edu/humanactivities/data.php).</p>\n\n<p>Content</p>\n\n<p>frames/*.png:<br>\nRGB frames selected from Cornell Activity Dataset. To find out the location of the frame<br>\nin the original videos, see video_info.txt.</p>\n\n<p>object_crop_images/*.png<br>\nimage crops taken from the selected frames and resized to 321*321. Each crop is a padded<br>\nbounding box of an object the human interacts with in the video. Due to the padding,<br>\nthe crops may contain background and other objects.<br>\nIn each selected frame, each bounding box was processed. The bounding boxes are already<br>\ngiven in the Cornell Activity Dataset.<br>\nThe 5-digit number gives the frame number, the second number gives the bounding box number<br>\nwithin the frame.</p>\n\n<p>segmentation_mat/*.mat<br>\n321*321*6 segmentation masks for the image crops. 
Each channel corresponds to an<br>\naffordance (openable, cuttable, pourable, containable, supportable, holdable, in this order).<br>\nAll pixels belonging to a particular affordance are labeled 1 in the respective channel,<br>\notherwise 0. \u00a0</p>\n\n<p>segmentation_png/*.png<br>\n321*321 png images, each containing the binary mask for one of the affordances.</p>\n\n<p>lists/*.txt<br>\nLists containing the train and test sets for two splits. The actor split ensures that<br>\ntrain and test images stem from different videos with different actors while the object split ensures<br>\nthat train and test data have no (central) object classes in common.<br>\nThe train sets are additionally subdivided into 3 subsets A, B and C. For the actor split,<br>\nthe subsets stem from different videos. For the object split, each subset contains<br>\nevery third crop of the train set.</p>\n\n<p>crop_coordinate_info.txt<br>\nMaps image crops to their coordinates in the frames.</p>\n\n<p>hpose_info.txt<br>\nMaps frames to 2d human pose coordinates. Hand annotated by us.</p>\n\n<p>object_info.txt<br>\nMaps image crops to the (central) object it contains.</p>\n\n<p>visible_affordance_info.txt<br>\nMaps image crops to affordances visible in this crop.</p>\n\n<p>\u00a0</p>\n\n<p>%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%55<br>\nThe crops contain the following object classes:<br>\n1.table<br>\n2.kettle<br>\n3.plate<br>\n4.bottle<br>\n5.thermal cup<br>\n6.knife<br>\n7.medicine box<br>\n8.can<br>\n9.microwave<br>\n10.paper box<br>\n11.bowl<br>\n12.mug</p>\n\n<p>Affordances in our set:<br>\n1.openable<br>\n2.cuttable<br>\n3.pourable<br>\n4.containable<br>\n5.supportable<br>\n6.holdable</p>\n\n<p>Note that our object affordance labeling differs from the Cornell Activity Dataset:<br>\nE.g. the cap of a pizza box is considered to be supportable.</p>\n\n<p>\u00a0</p>",
    "publication_date": "2017-04-07",
    "publisher": "Zenodo",
    "references": [
      {
        "reference": "Sawatzky, J., Srikantha, A., Gall, J.: Weakly supervised affordance detection. CVPR (2017)"
      }
    ],
    "related_identifiers": [
      {
        "identifier": "https://pages.iai.uni-bonn.de/gall_juergen/download/jgall_affordancedetection_cvpr17.pdf",
        "relation_type": {
          "id": "issupplementto",
          "title": {
            "de": "Erg\u00e4nzt",
            "en": "Is supplement to"
          }
        },
        "scheme": "url"
      },
      {
        "identifier": "https://github.com/ykztawas/Weakly-Supervised-Affordance-Detection",
        "relation_type": {
          "id": "issupplementto",
          "title": {
            "de": "Erg\u00e4nzt",
            "en": "Is supplement to"
          }
        },
        "scheme": "url"
      }
    ],
    "resource_type": {
      "id": "dataset",
      "title": {
        "de": "Datensatz",
        "en": "Dataset"
      }
    },
    "rights": [
      {
        "description": {
          "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited."
        },
        "icon": "cc-by-icon",
        "id": "cc-by-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution 4.0 International"
        }
      }
    ],
    "subjects": [
      {
        "subject": "computer vision"
      },
      {
        "subject": "affordances"
      },
      {
        "subject": "attributes"
      },
      {
        "subject": "semantic image segmentation"
      },
      {
        "subject": "robotics"
      },
      {
        "subject": "weakly supervised learning"
      },
      {
        "subject": "convolutional neural network"
      },
      {
        "subject": "anticipating human behavior"
      },
      {
        "subject": "mapping on demand"
      }
    ],
    "title": "CAD 120 affordance dataset"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "29724"
      }
    },
    "communities": {},
    "id": "795703",
    "pids": {
      "doi": {
        "identifier": "",
        "provider": "legacy"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.495570",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:495570",
      "provider": "oai"
    }
  },
  "revision_id": 7,
  "stats": {
    "all_versions": {
      "data_volume": 7446223755246.0,
      "downloads": 2897,
      "unique_downloads": 1130,
      "unique_views": 4510,
      "views": 5153
    },
    "this_version": {
      "data_volume": 7425661176702.0,
      "downloads": 2889,
      "unique_downloads": 1122,
      "unique_views": 4470,
      "views": 5109
    }
  },
  "status": "published",
  "updated": "2020-01-24T19:26:07.043850+00:00",
  "versions": {
    "index": 1,
    "is_latest": true
  }
}