Conference paper Open Access

Leveraging Linguistic Linked Data for Cross-Lingual Model Transfer in the Pharmaceutical Domain

Jorge Gracia; Christian Fäth; Matthias Hartung; Max Ionov; Julia Bosque-Gil; Susana Veríssimo; Christian Chiarcos; Matthias Orlikowski


JSON Export

{
  "files": [
    {
      "links": {
        "self": "https://zenodo.org/api/files/73a8648b-ddb0-40e5-a3ba-33ad5b23489e/PaL_Apertium_RDF_pipeline.pdf"
      }, 
      "checksum": "md5:24c25cc5c94b00ccd86c05fb1e0b40d3", 
      "bucket": "73a8648b-ddb0-40e5-a3ba-33ad5b23489e", 
      "key": "PaL_Apertium_RDF_pipeline.pdf", 
      "type": "pdf", 
      "size": 721008
    }
  ], 
  "owners": [
    78313
  ], 
  "doi": "10.1007/978-3-030-62466-8_31", 
  "stats": {
    "version_unique_downloads": 34.0, 
    "unique_views": 23.0, 
    "views": 24.0, 
    "version_views": 24.0, 
    "unique_downloads": 34.0, 
    "version_unique_views": 23.0, 
    "volume": 25235280.0, 
    "version_downloads": 35.0, 
    "downloads": 35.0, 
    "version_volume": 25235280.0
  }, 
  "links": {
    "doi": "https://doi.org/10.1007/978-3-030-62466-8_31", 
    "latest_html": "https://zenodo.org/record/4322607", 
    "bucket": "https://zenodo.org/api/files/73a8648b-ddb0-40e5-a3ba-33ad5b23489e", 
    "badge": "https://zenodo.org/badge/doi/10.1007/978-3-030-62466-8_31.svg", 
    "html": "https://zenodo.org/record/4322607", 
    "latest": "https://zenodo.org/api/records/4322607"
  }, 
  "created": "2020-12-15T10:32:55.221461+00:00", 
  "updated": "2020-12-15T13:28:16.622377+00:00", 
  "conceptrecid": "4322606", 
  "revision": 3, 
  "id": 4322607, 
  "metadata": {
    "access_right_category": "success", 
    "part_of": {
      "pages": "499-514", 
      "title": "The Semantic Web \u2013 ISWC 2020 19th International Semantic Web Conference, Part II"
    }, 
    "doi": "10.1007/978-3-030-62466-8_31", 
    "version": "pre-published version", 
    "license": {
      "id": "CC-BY-4.0"
    }, 
    "title": "Leveraging Linguistic Linked Data for Cross-Lingual Model Transfer in the Pharmaceutical Domain", 
    "relations": {
      "version": [
        {
          "count": 1, 
          "index": 0, 
          "parent": {
            "pid_type": "recid", 
            "pid_value": "4322606"
          }, 
          "is_last": true, 
          "last_child": {
            "pid_type": "recid", 
            "pid_value": "4322607"
          }
        }
      ]
    }, 
    "access_right": "open", 
    "imprint": {
      "publisher": "Springer", 
      "isbn": "978-3-030-62465-1"
    }, 
    "communities": [
      {
        "id": "nexuslinguarum"
      }, 
      {
        "id": "pret-a-llod"
      }
    ], 
    "grants": [
      {
        "code": "825182", 
        "links": {
          "self": "https://zenodo.org/api/grants/10.13039/501100000780::825182"
        }, 
        "title": "Ready-to-use Multilingual Linked Language Data for Knowledge Services across Sectors", 
        "acronym": "Pret-a-LLOD", 
        "program": "H2020", 
        "funder": {
          "doi": "10.13039/501100000780", 
          "acronyms": [], 
          "name": "European Commission", 
          "links": {
            "self": "https://zenodo.org/api/funders/10.13039/501100000780"
          }
        }
      }
    ], 
    "keywords": [
      "Apertium RDF, cross-lingual model transfer, Fintan"
    ], 
    "publication_date": "2020-11-01", 
    "creators": [
      {
        "orcid": "0000-0001-6452-7627", 
        "affiliation": "University of Zaragoza", 
        "name": "Jorge Gracia"
      }, 
      {
        "affiliation": "Goethe University Frankfurt", 
        "name": "Christian F\u00e4th"
      }, 
      {
        "affiliation": "Semalytix GmbH", 
        "name": "Matthias Hartung"
      }, 
      {
        "affiliation": "Goethe University Frankfurt", 
        "name": "Max Ionov"
      }, 
      {
        "affiliation": "University of Zaragoza", 
        "name": "Julia Bosque-Gil"
      }, 
      {
        "affiliation": "Semalytix GmbH", 
        "name": "Susana Ver\u00edssimo"
      }, 
      {
        "affiliation": "Goethe University Frankfurt", 
        "name": "Christian Chiarcos"
      }, 
      {
        "affiliation": "Semalytix GmbH", 
        "name": "Matthias Orlikowski"
      }
    ], 
    "meeting": {
      "acronym": "ISWC 2020", 
      "dates": "2-6 November  2020", 
      "title": "19th International Semantic Web Conference"
    }, 
    "subjects": [], 
    "resource_type": {
      "subtype": "conferencepaper", 
      "type": "publication", 
      "title": "Conference paper"
    }, 
    "description": "<p>We describe the use of linguistic linked data to support a cross-lingual transfer framework for sentiment analysis in the pharmaceutical domain. The proposed system dynamically gathers translations from the Linked Open Data (LOD) cloud, particularly from Apertium RDF, in order to project a deep learning-based sentiment classifier from one language to another, thus enabling scalability and avoiding the need of model re-training when transferred across languages. We describe the whole pipeline traversed by the multilingual data, from their conversion into RDF based on a new dynamic and flexible transformation framework, through their linking and publication as linked data, and finally their exploitation in the particular use case. Based on experiments on projecting a sentiment classifier from English to Spanish, we demonstrate how linked data techniques are able to enhance the multilingual capabilities of a deep learning-based approach in a dynamic and scalable way, in a real application scenario from the pharmaceutical domain.</p>"
  }
}
24
35
views
downloads
Views 24
Downloads 35
Data volume 25.2 MB
Unique views 23
Unique downloads 34

Share

Cite as