{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2022-02-24T17:04:12.905529+00:00",
  "custom_fields": {},
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "D3.2-Design, implementation and deployment of text mining and enrichment services Phase 1_v1.0.pdf": {
        "access": {
          "hidden": false
        },
        "checksum": "md5:8cb1a8a2eec9993476af23eae18c512e",
        "ext": "pdf",
        "id": "3bc0c2e6-f222-4498-9dd2-0cd8caf28d97",
        "key": "D3.2-Design, implementation and deployment of text mining and enrichment services Phase 1_v1.0.pdf",
        "links": {
          "content": "https://zenodo.org/api/records/6260513/files/D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/content",
          "iiif_api": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/full/0/default.png",
          "iiif_base": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf",
          "iiif_canvas": "https://zenodo.org/api/iiif/record:6260513/canvas/D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf",
          "iiif_info": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/info.json",
          "self": "https://zenodo.org/api/records/6260513/files/D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf"
        },
        "metadata": null,
        "mimetype": "application/pdf",
        "size": 1189605,
        "storage_class": "L"
      }
    },
    "order": [],
    "total_bytes": 1189605
  },
  "id": "6260513",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/6260513/access",
    "access_grants": "https://zenodo.org/api/records/6260513/access/grants",
    "access_links": "https://zenodo.org/api/records/6260513/access/links",
    "access_request": "https://zenodo.org/api/records/6260513/access/request",
    "access_users": "https://zenodo.org/api/records/6260513/access/users",
    "archive": "https://zenodo.org/api/records/6260513/files-archive",
    "archive_media": "https://zenodo.org/api/records/6260513/media-files-archive",
    "communities": "https://zenodo.org/api/records/6260513/communities",
    "communities-suggestions": "https://zenodo.org/api/records/6260513/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.6260513",
    "draft": "https://zenodo.org/api/records/6260513/draft",
    "file_modification": "https://zenodo.org/api/records/6260513/file-modification",
    "files": "https://zenodo.org/api/records/6260513/files",
    "latest": "https://zenodo.org/api/records/6260513/versions/latest",
    "latest_html": "https://zenodo.org/records/6260513/latest",
    "media_files": "https://zenodo.org/api/records/6260513/media-files",
    "parent": "https://zenodo.org/api/records/6260512",
    "parent_doi": "https://doi.org/10.5281/zenodo.6260512",
    "parent_doi_html": "https://zenodo.org/doi/10.5281/zenodo.6260512",
    "parent_html": "https://zenodo.org/records/6260512",
    "preview_html": "https://zenodo.org/records/6260513?preview=1",
    "quota_increase": "https://zenodo.org/api/records/6260513/quota-increase",
    "request_deletion": "https://zenodo.org/api/records/6260513/request-deletion",
    "requests": "https://zenodo.org/api/records/6260513/requests",
    "reserve_doi": "https://zenodo.org/api/records/6260513/draft/pids/doi",
    "self": "https://zenodo.org/api/records/6260513",
    "self_doi": "https://doi.org/10.5281/zenodo.6260513",
    "self_doi_html": "https://zenodo.org/doi/10.5281/zenodo.6260513",
    "self_html": "https://zenodo.org/records/6260513",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:6260513/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:6260513/sequence/default",
    "thumbnails": {
      "10": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/%5E10,/0/default.jpg",
      "100": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/%5E100,/0/default.jpg",
      "1200": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/%5E1200,/0/default.jpg",
      "250": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/%5E250,/0/default.jpg",
      "50": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/%5E50,/0/default.jpg",
      "750": "https://zenodo.org/api/iiif/record:6260513:D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf/full/%5E750,/0/default.jpg"
    },
    "versions": "https://zenodo.org/api/records/6260513/versions"
  },
  "media_files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "D3.2-Design, implementation and deployment of text mining and enrichment services Phase 1_v1.0.pdf.ptif": {
        "access": {
          "hidden": true
        },
        "ext": "ptif",
        "id": "5113fa58-66b4-4fab-83ea-544d92ffbb37",
        "key": "D3.2-Design, implementation and deployment of text mining and enrichment services Phase 1_v1.0.pdf.ptif",
        "links": {
          "content": "https://zenodo.org/api/records/6260513/files/D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf.ptif/content",
          "self": "https://zenodo.org/api/records/6260513/files/D3.2-Design,%20implementation%20and%20deployment%20of%20text%20mining%20and%20enrichment%20services%20Phase%201_v1.0.pdf.ptif"
        },
        "metadata": null,
        "mimetype": "application/octet-stream",
        "processor": {
          "source_file_id": "3bc0c2e6-f222-4498-9dd2-0cd8caf28d97",
          "status": "finished",
          "type": "image-tiles"
        },
        "size": 0,
        "storage_class": "L"
      }
    },
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "additional_descriptions": [
      {
        "description": "This is the draft version of the deliverable not yet approved by the European Commission.",
        "type": {
          "id": "notes",
          "title": {
            "de": "Anmerkungen",
            "en": "Notes"
          }
        }
      }
    ],
    "creators": [
      {
        "affiliations": [
          {
            "name": "Expert.ai"
          }
        ],
        "person_or_org": {
          "family_name": "Raul Ortega",
          "name": "Raul Ortega",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "Expert.ai"
          }
        ],
        "person_or_org": {
          "family_name": "Andres Garcia-Silva",
          "name": "Andres Garcia-Silva",
          "type": "personal"
        }
      },
      {
        "affiliations": [
          {
            "name": "Expert.ai"
          }
        ],
        "person_or_org": {
          "family_name": "Jose Manuel Gomez-Perez",
          "name": "Jose Manuel Gomez-Perez",
          "type": "personal"
        }
      }
    ],
    "description": "<p>This deliverable reports the progress in the design and development of the first version of the text mining and enrichment services for Research Objects and scientific documents in RELIANCE. In the early stage of the project, we gathered a corpus of scientific documents in the domains of interest for RELIANCE user communities that was used to customize the knowledge graph underlying the text mining and enrichment services. Once the knowledge graph was adapted to the scientific vocabulary used by RELIANCE users, we were ready to start the development of the text mining and enrichment services.</p>\n\n<p>Among such services is the semantic enrichment service of Research Objects and Scientific documents. The enrichment service processes the text from documents or Research objects and yields semantic metadata describing the text content. The semantic metadata is a synthesis of the text and includes concepts, lemmas, multi-word expressions, and topics. In addition, we are working on the generation of a Field of Research metadata that we plan to integrate in the enrichment service. To generate this type of metadata, we trained a classifier by fine-tuning a pre-trained RoBERTa language model on the corpus that we gathered for RELIANCE users where scientific papers are tagged with Field of Research categories (e.g., Geology, Oceanography, or Atmospheric Sciences). The enrichment service for documents is already onboarded in EOSC as a RESTful service, and the service that enriches Research Objects is integrated in ROHub.</p>\n\n<p>Next, we developed information retrieval tools exploiting the semantic metadata added to Research Objects along with their text content. First, a faceted search engine where users can search the Research Objects collection in ROHub using the traditional keywords, but also facets for each of the types of the semantic metadata. A faceted search engine allows complex queries and retrieving Research Objects more precisely. 
Second, a recommendation engine that suggests potentially relevant research objects based on the content of a selection of other research objects or users. If the reference is a research object, the recommendation engine uses the semantic metadata of the research object to recommend similar research objects. If the reference is a user, the recommendation engine first aggregates all the semantic metadata of the research objects owned by such user and then uses the semantic metadata to suggest relevant research objects. The search engine and the recommendation system are being onboarded in EOSC as RESTful services.</p>\n\n<p>During this stage of the project, we lay the foundations for the development in the next phase of the extended set of analytics services where we plan to address the Influence Network Extraction, the Novelty Score for Research Objects, Support to Reading Comprehension, and Text Mining and Enrichment Dashboard. While the design and development of such services will be covered in depth in the second version of this deliverable, in this version we have included a brief description of each of them. In the second version of this deliverable, we plan to increase the metadata produced by the enrichment service including titles, abstracts, authors, citations, and data cube references.</p>\n\n<p>Finally, in the second phase of the project we will work on the user interfaces for the recommendation system, the search engine, the visualization of the semantic enrichment results for research objects, and a prototype of a browser plugin that allows scientists to ingest scientific publications into their bibliographic research objects as they browse the internet searching for relevant literature for their research.</p>",
    "funding": [
      {
        "award": {
          "acronym": "RELIANCE",
          "id": "00k4n6c32::101017501",
          "identifiers": [
            {
              "identifier": "https://cordis.europa.eu/projects/101017501",
              "scheme": "url"
            }
          ],
          "number": "101017501",
          "program": "H2020-EU.1.4.",
          "title": {
            "en": "REsearch LIfecycle mAnagemeNt for Earth Science Communities and CopErnicus users in EOSC"
          }
        },
        "funder": {
          "id": "00k4n6c32",
          "name": "European Commission"
        }
      }
    ],
    "languages": [
      {
        "id": "eng",
        "title": {
          "en": "English"
        }
      }
    ],
    "publication_date": "2022-01-07",
    "publisher": "Zenodo",
    "resource_type": {
      "id": "publication-deliverable",
      "title": {
        "de": "Projektergebnis",
        "en": "Project deliverable"
      }
    },
    "rights": [
      {
        "description": {
          "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited."
        },
        "icon": "cc-by-icon",
        "id": "cc-by-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution 4.0 International"
        }
      }
    ],
    "subjects": [
      {
        "subject": "RELIANCE"
      },
      {
        "subject": "Research Objects"
      },
      {
        "subject": "ROhub"
      },
      {
        "subject": "RO-Crate"
      },
      {
        "subject": "Data cubes"
      },
      {
        "subject": "EOSC"
      }
    ],
    "title": "D3.2v1 Design, implementation and deployment of text mining and enrichment services Phase 1",
    "version": "Version 1.0"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "237794"
      }
    },
    "communities": {
      "entries": [
        {
          "access": {
            "member_policy": "open",
            "members_visibility": "restricted",
            "record_submission_policy": "open",
            "review_policy": "closed",
            "visibility": "public"
          },
          "children": {
            "allow": true
          },
          "created": "2022-11-23T15:53:29.436323+00:00",
          "custom_fields": {},
          "deletion_status": {
            "is_deleted": false,
            "status": "P"
          },
          "id": "f0a8b890-f97a-4eb2-9eac-8b8a712d3a6c",
          "links": {},
          "metadata": {
            "curation_policy": "<h2>Curation policy</h2>\n<p>The EU Open Research Repository serves as a repository for research outputs (data, software, posters, presentations, publications, etc) which have been funded under an EU research funding programme such as Horizon Europe, Euratom or earlier Framework Programmes.</p>\n<p>The community is managed by CERN on behalf of the European Commission.&nbsp;</p>\n<p><a href=\"https://about.zenodo.org/policies/\">Zenodo&rsquo;s general policies</a> and <a href=\"https://about.zenodo.org/terms/\">Terms of Use</a> apply to all content.</p>\n<h3>Scope</h3>\n<p>The EU Open Research Repository accepts all digital research objects which is a research output stemming from one of EU&rsquo;s research and innovation funding programmes. The funding programmes currently include:</p>\n<ul>\n<li>\n<p>Horizon Europe (including ERC, MSCA), earlier Framework Programmes (eg Horizon 2020) as well as Euratom.</p>\n</li>\n</ul>\n<p>In line with the principle as open as possible, as closed as necessary both public and restricted content is accepted. See note on how <a href=\"https://about.zenodo.org/infrastructure/\">Zenodo handles restricted content</a>.</p>\n<h3>Content submission</h3>\n<p>EU programme beneficiaries are eligible to submit content to the community. The community supports three types of content submissions:</p>\n<ul>\n<li>\n<p>Submission via an EU Project Community (through user interface or programmatic APIs).</p>\n</li>\n<li>\n<p>Submission directly to the EU Open Research Repository.</p>\n</li>\n<li>\n<p>Automated harvesting from existing Zenodo content.</p>\n</li>\n</ul>\n<h4>Project community (preferred)</h4>\n<p>A representative of an EU project may request an EU Project Community and invite other project participants as members of the community. The project community is linked to one or more European Commission grants. 
All records in the project community are automatically integrated into the EU Open Research Repository immediately upon acceptance into the project community.&nbsp;</p>\n<h4>Direct submission</h4>\n<p>Any user may submit a record directly to the EU Open Research Repository. The submission will be moderated by Zenodo staff for compliance with the minimal required metadata requirements and its correctness.</p>\n<h4>Automated harvesting</h4>\n<p>Records found among Zenodo&rsquo;s existing content will on a regular basis automatically be integrated if they are found to comply with the requirements. The submissions through this method are integrated into the EU Open Research Repository with delay in a fully automated way.</p>\n<h3>Descriptive information</h3>\n<h4>Minimal metadata requirements</h4>\n<p>Records in the EU Open Research Repository are required to comply with the following minimal metadata requirements:</p>\n<ul>\n<li>\n<p>Visibility: Both public and restricted (with or without embargo and/or access request)</p>\n</li>\n<li>\n<p>Resource types: All resource types.</p>\n</li>\n<li>\n<p>Licenses: Public and embargoed records MUST specify a license. The chosen license SHOULD be compliant with the Horizon Europe open science requirements (see <a href=\"/communities/eu/pages/open-science\">Open Science in Horizon Europe</a>)</p>\n</li>\n<li>\n<p>Funding information: Records MUST specify at least one grant from the European Commission.</p>\n</li>\n<li>Journal articles: Records MUST specify at the publishing venue (e.g. the journal the article was published in).</li>\n<li>\n<p>Creators: Creators SHOULD be identified with a persistent identifier (e.g. ORCID, GND, &hellip;), and affiliations SHOULD be identified with a persistent identifier (e.g. 
ROR, ISNI, &hellip;)</p>\n</li>\n<li>\n<p>Subjects: Records SHOULD specify one or more fields of science from the <a href=\"https://op.europa.eu/en/web/eu-vocabularies/euroscivoc\">European Science Vocabulary</a>.</p>\n</li>\n</ul>\n<p>These metadata requirements come from the related open science requirements in Horizon Europe which are detailed in each project's grant agreement.</p>\n<h3>Review &amp; moderation</h3>\n<p>All submissions undergo automated curation checks for compliance with the policy. Submissions through project communities are in addition reviewed by the project community. Submission directly to the EU Open Research Repository is in addition reviewed by Zenodo staff.</p>\n<p>Community curators may at any point edit metadata of the records in the community without notice through human or automated processing. The curators may at their sole discretion remove records from the community that are deemed not to comply with the content and curation policy or which are deemed of insufficient quality.</p>\n<h3>Updates</h3>\n<p>The content and curation policy is subject to change by the community owner at any time and without notice, other than through updating this page.</p>",
            "description": "Open repository for EU-funded research outputs from Horizon Europe, Euratom, and earlier Framework Programmes.",
            "funding": [
              {
                "funder": {
                  "id": "00k4n6c32"
                }
              }
            ],
            "organizations": [
              {
                "id": "00k4n6c32"
              }
            ],
            "page": "<h2>About</h2>\n<p>The EU Open Research Repository is a Zenodo-community dedicated to fostering open science and enhancing the visibility and accessibility of research outputs funded by the European Union. The community is managed by CERN on behalf of the European Commission.</p>\n<h3>Mission</h3>\n<p>The mission of the repository is to support the implementation of the EU's open science policy, providing a trusted and comprehensive space for researchers to share their research outputs such as data, software, reports, presentations, posters and more. The EU Open Research Repository simplifies the process of complying with open science requirements, ensuring that research outputs from Horizon Europe, Euratom, and earlier Framework Programmes are freely accessible, thereby accelerating scientific discovery and innovation.</p>\n<h3>EU Open Research Repository vs Open Research Europe (ORE)</h3>\n<p>The EU Open Research Repository serves as a complementary platform to the <a href=\"https://open-research-europe.ec.europa.eu/\">Open Research Europe</a> (ORE) publishing platform. Open Research Europe focuses on providing a publishing venue for peer-reviewed articles, ensuring that research meets rigorous academic standards. The EU Open Research Repository provides a space for all the other research outputs including data sets, software, posters, and presentations that are out of scope for ORE. This holistic approach enables researchers to not only publish their findings but also share the underlying data and materials that support their work, fostering transparency and reproducibility in the scientific process.&nbsp;</p>\n<h3>Funding</h3>\n<p>The EU Open Research Repository is funded by the European Union under grant agreement no. <a href=\"https://cordis.europa.eu/project/id/101256740\">101256740</a>&nbsp; (HORIZON-ZEN Plus). 
For more information about the project see <a href=\"https://about.zenodo.org/projects/horizon-zen-plus/\">https://about.zenodo.org/projects/horizon-zen/.</a></p>",
            "title": "EU Open Research Repository",
            "type": {
              "id": "organization"
            },
            "website": "https://research-and-innovation.ec.europa.eu"
          },
          "revision_id": 24,
          "slug": "eu",
          "theme": {
            "brand": "horizon",
            "enabled": true,
            "style": {
              "font": {
                "family": "Arial, sans-serif",
                "size": "16px",
                "weight": 600
              },
              "mainHeaderBackgroundColor": "#FFFFFF",
              "primaryColor": "#004494",
              "primaryTextColor": "#FFFFFF",
              "secondaryColor": "#FFD617",
              "secondaryTextColor": "#000000",
              "tertiaryColor": "#e3eefd",
              "tertiaryTextColor": "#1c5694"
            }
          },
          "updated": "2026-03-31T12:29:43.596724+00:00"
        }
      ],
      "ids": [
        "f0a8b890-f97a-4eb2-9eac-8b8a712d3a6c"
      ]
    },
    "id": "6260512",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.6260512",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.6260513",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:6260513",
      "provider": "oai"
    }
  },
  "revision_id": 7,
  "stats": {
    "all_versions": {
      "data_volume": 128477340.0,
      "downloads": 108,
      "unique_downloads": 108,
      "unique_views": 125,
      "views": 125
    },
    "this_version": {
      "data_volume": 124908525.0,
      "downloads": 105,
      "unique_downloads": 105,
      "unique_views": 122,
      "views": 122
    }
  },
  "status": "published",
  "swh": {},
  "updated": "2024-07-17T09:59:06.189248+00:00",
  "versions": {
    "index": 1,
    "is_latest": true
  }
}