{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2018-11-09T13:22:16.708054+00:00",
  "custom_fields": {},
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "D7.1 - Scalability and Robustness Experimental Methodology.pdf": {
        "checksum": "md5:496ef6ee51083255939dd4dca3289cbc",
        "ext": "pdf",
        "id": "a3e87cea-4abe-4b33-86af-7dae9cf17012",
        "key": "D7.1 - Scalability and Robustness Experimental Methodology.pdf",
        "metadata": null,
        "mimetype": "application/pdf",
        "size": 911331
      }
    },
    "order": [],
    "total_bytes": 911331
  },
  "id": "1481773",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/1481773/access",
    "access_grants": "https://zenodo.org/api/records/1481773/access/grants",
    "access_links": "https://zenodo.org/api/records/1481773/access/links",
    "access_request": "https://zenodo.org/api/records/1481773/access/request",
    "access_users": "https://zenodo.org/api/records/1481773/access/users",
    "archive": "https://zenodo.org/api/records/1481773/files-archive",
    "archive_media": "https://zenodo.org/api/records/1481773/media-files-archive",
    "communities": "https://zenodo.org/api/records/1481773/communities",
    "communities-suggestions": "https://zenodo.org/api/records/1481773/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.1481773",
    "draft": "https://zenodo.org/api/records/1481773/draft",
    "files": "https://zenodo.org/api/records/1481773/files",
    "latest": "https://zenodo.org/api/records/1481773/versions/latest",
    "latest_html": "https://zenodo.org/records/1481773/latest",
    "media_files": "https://zenodo.org/api/records/1481773/media-files",
    "parent": "https://zenodo.org/api/records/1481772",
    "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.1481772",
    "parent_html": "https://zenodo.org/records/1481772",
    "requests": "https://zenodo.org/api/records/1481773/requests",
    "reserve_doi": "https://zenodo.org/api/records/1481773/draft/pids/doi",
    "self": "https://zenodo.org/api/records/1481773",
    "self_doi": "https://zenodo.org/doi/10.5281/zenodo.1481773",
    "self_html": "https://zenodo.org/records/1481773",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:1481773/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:1481773/sequence/default",
    "versions": "https://zenodo.org/api/records/1481773/versions"
  },
  "media_files": {
    "count": 0,
    "enabled": false,
    "entries": {},
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "creators": [
      {
        "affiliations": [
          {
            "name": "CNR"
          }
        ],
        "person_or_org": {
          "family_name": "Mele",
          "given_name": "Ida",
          "identifiers": [
            {
              "identifier": "0000-0002-3730-6383",
              "scheme": "orcid"
            }
          ],
          "name": "Mele, Ida",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "CNR"
          }
        ],
        "person_or_org": {
          "family_name": "Tonellotto",
          "given_name": "Nicola",
          "identifiers": [
            {
              "identifier": "0000-0002-7427-1001",
              "scheme": "orcid"
            }
          ],
          "name": "Tonellotto, Nicola",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "CNR"
          }
        ],
        "person_or_org": {
          "family_name": "Nardini",
          "given_name": "Franco Maria",
          "identifiers": [
            {
              "identifier": "0000-0003-3183-334X",
              "scheme": "orcid"
            }
          ],
          "name": "Nardini, Franco Maria",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "CNR"
          }
        ],
        "person_or_org": {
          "family_name": "Perego",
          "given_name": "Raffaele",
          "identifiers": [
            {
              "identifier": "0000-0001-7189-4724",
              "scheme": "orcid"
            }
          ],
          "name": "Perego, Raffaele",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "CNR"
          }
        ],
        "person_or_org": {
          "family_name": "Monteiro de Lira",
          "given_name": "Vinicius",
          "identifiers": [
            {
              "identifier": "0000-0002-7580-1756",
              "scheme": "orcid"
            }
          ],
          "name": "Monteiro de Lira, Vinicius",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "CNR"
          }
        ],
        "person_or_org": {
          "family_name": "Muntean",
          "given_name": "Cristina",
          "identifiers": [
            {
              "identifier": "0000-0001-5265-1831",
              "scheme": "orcid"
            }
          ],
          "name": "Muntean, Cristina",
          "type": "personal"
        }
      }
    ],
    "description": "<p>The deliverable D7.1, &ldquo;Scalability and Robustness Experimental Methodology&rdquo;, consists of a report describing the methodology for assessing the performance of a big data system. In particular, the purpose of task 7.1 is to develop and to implement a rigorous automated testing methodology for measuring and comparing the efficiency of the components in a big data system. The methodology takes into account the characteristics of the system and also the heterogeneity and distributed nature of big data.</p>\n\n<p>In this first version of the deliverable, we present the general concepts related to big data and its properties (i.e., volume, velocity, variety, and veracity). We analyze the state of the art in big data benchmarking considering different challenges which range from preserving the 4V properties of big data to streaming and scalability issues.</p>\n\n<p>Besides reviewing the literature, we present the steps that can be followed to rigorously test the BDG system. We believe that it would be better to follow a layered design where the user interfaces are at the top in order to provide easy access to the benchmarking for the user. Below the interfaces, there are the functional and execution layers. The former makes it possible to capture the data and test generators as well as the metrics; the latter represents the basic operations for configuring the system, converting the data, and analyzing the results.</p>\n\n<p>Another contribution of this deliverable is providing some guidelines that can be helpful in the process of rigorously testing a big data system. We believe that a good approach would be following a standardized benchmarking methodology which is divided into different stages going from the selection of the application domain to the execution of the tests. Since the BDG system is not finalized yet, these guidelines are very general and will be refined and concretized once the system has been developed.</p>\n\n<p>Since in the BDG project the semantic infrastructure is represented by graph databases, we also describe the main limitations of the current benchmarking in the context of relational databases and semantic repositories. Also, we provide some valid solutions for our project, for example, the benchmarks proposed by the Linked Data Benchmark Council (LDBC) which ensure linearity, reliability, repeatability, and ease of measurement of the metrics. Additionally, LDBC is open for submissions of novel industry benchmarks which may represent specificity of data distribution in big data applications, and this makes it particularly suitable for the BDG project.</p>\n\n<p>Another contribution of this deliverable is a first proposal on the metrics to use for assessing the performance of the BDG system. Such metrics are chosen based on the datasets employed in the use cases of the BDG project. As with the guidelines, the metrics are also subject to change since the use cases could be refined during the development of the project and the corresponding datasets and metrics would change accordingly.</p>",
    "funding": [
      {
        "award": {
          "acronym": "BigDataGrapes",
          "id": "00k4n6c32::780751",
          "identifiers": [
            {
              "identifier": "https://cordis.europa.eu/projects/780751",
              "scheme": "url"
            }
          ],
          "number": "780751",
          "program": "H2020",
          "title": {
            "en": "Big Data to Enable Global Disruption of the Grapevine-powered Industries"
          }
        },
        "funder": {
          "id": "00k4n6c32",
          "name": "European Commission"
        }
      }
    ],
    "languages": [
      {
        "id": "eng",
        "title": {
          "en": "English"
        }
      }
    ],
    "publication_date": "2018-09-28",
    "publisher": "Zenodo",
    "resource_type": {
      "id": "publication-deliverable",
      "title": {
        "de": "Projektergebnis",
        "en": "Project deliverable"
      }
    },
    "rights": [
      {
        "description": {
          "en": ""
        },
        "icon": "cc-by-nc-icon",
        "id": "cc-by-nc-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by-nc/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution Non Commercial 4.0 International"
        }
      }
    ],
    "subjects": [
      {
        "subject": "4V properties; big data; semantic infrastructure; graph databases"
      }
    ],
    "title": "BigDataGrapes D7.1 - Scalability and Robustness Experimental Methodology",
    "version": "1.0 | Final"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "48887"
      }
    },
    "communities": {
      "default": "ac1a29f8-93dc-4733-ae73-ab3eeb9c7f90",
      "entries": [
        {
          "access": {
            "member_policy": "open",
            "members_visibility": "public",
            "record_policy": "open",
            "review_policy": "open",
            "visibility": "public"
          },
          "children": {
            "allow": false
          },
          "created": "2018-06-27T22:24:39.054543+00:00",
          "custom_fields": {},
          "deletion_status": {
            "is_deleted": false,
            "status": "P"
          },
          "id": "ac1a29f8-93dc-4733-ae73-ab3eeb9c7f90",
          "links": {},
          "metadata": {
            "curation_policy": "<p>All public documentation and/or dissemination material produced by the BigDataGrapes project will be included under this community. Any material either not belonging to the above category or characterized as restricted will be declined.</p>\r\n",
            "page": "<p>The BigDataGrapes community includes most of the public deliverables, documents and dissemination material created through the H2020 BigDataGrapes Project (http://www.bigdatagrapes.eu/), which has received funding from the European Union&rsquo;s Horizon 2020 research and innovation programme under grant agreement No 780751</p>",
            "title": "BigDataGrapes Project"
          },
          "revision_id": 0,
          "slug": "bigdatagrapes",
          "updated": "2018-06-27T22:24:39.218097+00:00"
        },
        {
          "access": {
            "member_policy": "open",
            "members_visibility": "restricted",
            "record_policy": "open",
            "review_policy": "closed",
            "visibility": "public"
          },
          "children": {
            "allow": true
          },
          "created": "2022-11-23T15:53:29.436323+00:00",
          "custom_fields": {},
          "deletion_status": {
            "is_deleted": false,
            "status": "P"
          },
          "id": "f0a8b890-f97a-4eb2-9eac-8b8a712d3a6c",
          "links": {},
          "metadata": {
            "curation_policy": "<h2>Curation policy</h2>\n<p>The EU Open Research Repository serves as a repository for research outputs (data, software, posters, presentations, publications, etc) which have been funded under an EU research funding programme such as Horizon Europe, Euratom or earlier Framework Programmes.</p>\n<p>The community is managed by CERN on behalf of the European Commission.&nbsp;</p>\n<p><a href=\"https://about.zenodo.org/policies/\">Zenodo&rsquo;s general policies</a> and <a href=\"https://about.zenodo.org/terms/\">Terms of Use</a> apply to all content.</p>\n<h3>Scope</h3>\n<p>The EU Open Research Repository accepts all digital research objects which is a research output stemming from one of EU&rsquo;s research and innovation funding programmes. The funding programmes currently include:</p>\n<ul>\n<li>\n<p>Horizon Europe (including ERC, MSCA), earlier Framework Programmes (eg Horizon 2020) as well as Euratom.</p>\n</li>\n</ul>\n<p>In line with the principle as open as possible, as closed as necessary both public and restricted content is accepted. See note on how <a href=\"https://about.zenodo.org/infrastructure/\">Zenodo handles restricted content</a>.</p>\n<h3>Content submission</h3>\n<p>EU programme beneficiaries are eligible to submit content to the community. The community supports three types of content submissions:</p>\n<ul>\n<li>\n<p>Submission via an EU Project Community (through user interface or programmatic APIs).</p>\n</li>\n<li>\n<p>Submission directly to the EU Open Research Repository.</p>\n</li>\n<li>\n<p>Automated harvesting from existing Zenodo content.</p>\n</li>\n</ul>\n<h4>Project community (preferred)</h4>\n<p>A representative of an EU project may request an EU Project Community and invite other project participants as members of the community. The project community is linked to one or more European Commission grants. 
All records in the project community are automatically integrated into the EU Open Research Repository immediately upon acceptance into the project community.&nbsp;</p>\n<h4>Direct submission</h4>\n<p>Any user may submit a record directly to the EU Open Research Repository. The submission will be moderated by Zenodo staff for compliance with the minimal required metadata requirements and its correctness.</p>\n<h4>Automated harvesting</h4>\n<p>Records found among Zenodo&rsquo;s existing content will on a regular basis automatically be integrated if they are found to comply with the requirements. The submissions through this method are integrated into the EU Open Research Repository with delay in a fully automated way.</p>\n<h3>Descriptive information</h3>\n<h4>Minimal metadata requirements</h4>\n<p>Records in the EU Open Research Repository are required to comply with the following minimal metadata requirements:</p>\n<ul>\n<li>\n<p>Visibility: Both public and restricted (with or without embargo and/or access request)</p>\n</li>\n<li>\n<p>Resource types: All resource types.</p>\n</li>\n<li>\n<p>Licenses: Public and embargoed records MUST specify a license.</p>\n</li>\n<li>\n<p>Funding information: Records MUST specify at least one grant from the European Commission.</p>\n</li>\n<li>\n<p>Creators: Creators SHOULD be identified with a persistent identifier (e.g. ORCID, GND, &hellip;), and affiliations SHOULD be identified with a persistent identifier (e.g. ROR, ISNI, &hellip;)</p>\n</li>\n<li>\n<p>Subjects: Records SHOULD specify one or more fields of science from the <a href=\"https://op.europa.eu/en/web/eu-vocabularies/euroscivoc\">European Science Vocabulary</a>.</p>\n</li>\n</ul>\n<h3>Review &amp; moderation</h3>\n<p>All submissions will undergo automated curation checks for compliance with the policy. Submissions through project communities are reviewed by the project community. 
Submission directly to the EU Open Research Repository is reviewed by Zenodo staff.</p>\n<p>Community curators may at any point edit metadata of the records in the community without notice through human or automated processing. The curators may at their sole discretion remove records from the community that are deemed not to comply with the content and curation policy or which are deemed of insufficient quality.</p>\n<h3>Updates</h3>\n<p>The content and curation policy is subject to change by the community owner at any time and without notice, other than through updating this page.</p>",
            "description": "Open repository for EU-funded research outputs from Horizon Europe, Euratom and earlier Framework Programmes.",
            "organizations": [
              {
                "id": "00k4n6c32"
              }
            ],
            "page": "<h2>About</h2>\n<p>The EU Open Research Repository is a Zenodo community dedicated to fostering open science and enhancing the visibility and accessibility of research outputs funded by the European Union. The community is managed by CERN on behalf of the European Commission.</p>\n<h3>Mission</h3>\n<p>The mission of the repository is to support the implementation of the EU's open science policy, providing a trusted and comprehensive space for researchers to share their research outputs such as data, software, reports, presentations, posters and more. The EU Open Research Repository simplifies the process of complying with open science requirements, ensuring that research outputs from Horizon Europe, Euratom, and earlier Framework Programmes are freely accessible, thereby accelerating scientific discovery and innovation.</p>\n<h3>EU Open Research Repository vs Open Research Europe (ORE)</h3>\n<p>The EU Open Research Repository serves as a complementary platform to the <a href=\"https://open-research-europe.ec.europa.eu/\">Open Research Europe</a> (ORE) publishing platform. Open Research Europe focuses on providing a publishing venue for peer-reviewed articles, ensuring that research meets rigorous academic standards. The EU Open Research Repository provides a space for all the other research outputs including data sets, software, posters, and presentations that are out of scope for ORE. This holistic approach enables researchers to not only publish their findings but also share the underlying data and materials that support their work, fostering transparency and reproducibility in the scientific process.&nbsp;</p>\n<h3>Pilot phase</h3>\n<p>Currently in its pilot phase and set to be fully operational during autumn 2024, the EU Open Research Repository is constantly evolving. Efforts are committed to integrating cutting-edge features, including automated curation checks and FAIR (Findable, Accessible, Interoperable, and Reusable) assistance, to further support the research community. The goal is to provide researchers with a simple go-to solution for making their publicly funded research open and as FAIR as possible.<strong>&nbsp;</strong></p>\n<h3>Funding</h3>\n<p>The EU Open Research Repository is funded by the European Union under grant agreement no. <a href=\"https://cordis.europa.eu/project/id/101122956\">101122956</a> (HORIZON-ZEN). For more information about the project see <a href=\"https://about.zenodo.org/projects/horizon-zen/\">https://about.zenodo.org/projects/horizon-zen/</a>.</p>",
            "title": "EU Open Research Repository (Pilot)",
            "type": {
              "id": "organization"
            },
            "website": "https://research-and-innovation.ec.europa.eu"
          },
          "revision_id": 16,
          "slug": "eu",
          "theme": {
            "brand": "horizon",
            "enabled": true,
            "style": {
              "font": {
                "family": "Arial, sans-serif",
                "size": "16px",
                "weight": 600
              },
              "mainHeaderBackgroundColor": "#FFFFFF",
              "primaryColor": "#004494",
              "primaryTextColor": "#FFFFFF",
              "secondaryColor": "#FFD617",
              "secondaryTextColor": "#000000",
              "tertiaryColor": "#e3eefd",
              "tertiaryTextColor": "#1c5694"
            }
          },
          "updated": "2024-03-20T06:47:47.577483+00:00"
        }
      ],
      "ids": [
        "ac1a29f8-93dc-4733-ae73-ab3eeb9c7f90",
        "f0a8b890-f97a-4eb2-9eac-8b8a712d3a6c"
      ]
    },
    "id": "1481772",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.1481772",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.1481773",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:1481773",
      "provider": "oai"
    }
  },
  "revision_id": 9,
  "stats": {
    "all_versions": {
      "data_volume": 170621424.0,
      "downloads": 176,
      "unique_downloads": 147,
      "unique_views": 199,
      "views": 230
    },
    "this_version": {
      "data_volume": 54679860.0,
      "downloads": 60,
      "unique_downloads": 54,
      "unique_views": 88,
      "views": 103
    }
  },
  "status": "published",
  "updated": "2020-01-20T16:47:16.022918+00:00",
  "versions": {
    "index": 1,
    "is_latest": false
  }
}