Preprint Open Access

Using logical constraints to validate information in collaborative knowledge graphs: a study of COVID-19 on Wikidata

Houcemeddine Turki; Dariusz Jemielniak; Mohamed Ali Hadj Taieb; Jose Emilio Labra Gayo; Mohamed Ben Aouicha; Mus'ab Banat; Thomas Shafee; Eric Prud'Hommeaux; Tiago Lubiana; Diptanshu Das; Daniel Mietchen


DataCite XML Export

<?xml version='1.0' encoding='utf-8'?>
<!--
  DataCite metadata record (kernel-4 namespace) for DOI 10.5281/zenodo.4445363,
  a preprint published on Zenodo.

  The schemaLocation hint references the 4.4 XSD because resourceTypeGeneral
  below uses the value "Preprint", which is not part of the 4.1 controlled
  list that was previously referenced. The namespace URI is unchanged, so
  consumers that bind on the namespace are unaffected.
-->
<resource xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xmlns="http://datacite.org/schema/kernel-4"
          xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.4/metadata.xsd">
  <identifier identifierType="DOI">10.5281/zenodo.4445363</identifier>
  <!-- Authors in citation order; each carries an ORCID iD and one affiliation. -->
  <creators>
    <creator>
      <creatorName>Houcemeddine Turki</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0003-3492-2014</nameIdentifier>
      <affiliation>Faculty of Medicine of Sfax, University of Sfax, Sfax, Tunisia</affiliation>
    </creator>
    <creator>
      <creatorName>Dariusz Jemielniak</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0002-3745-7931</nameIdentifier>
      <affiliation>Department of Management in Networked and Digital Societies, Kozminski University, Warsaw, Poland</affiliation>
    </creator>
    <creator>
      <creatorName>Mohamed Ali Hadj Taieb</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0002-2786-8913</nameIdentifier>
      <affiliation>Faculty of Sciences of Sfax, University of Sfax, Sfax, Tunisia</affiliation>
    </creator>
    <creator>
      <creatorName>Jose Emilio Labra Gayo</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0001-8907-5348</nameIdentifier>
      <affiliation>Web Semantics Oviedo (WESO) Research Group, University of Oviedo, Spain</affiliation>
    </creator>
    <creator>
      <creatorName>Mohamed Ben Aouicha</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0002-2277-5814</nameIdentifier>
      <affiliation>Faculty of Sciences of Sfax, University of Sfax, Sfax, Tunisia</affiliation>
    </creator>
    <creator>
      <creatorName>Mus'ab Banat</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0001-9132-3849</nameIdentifier>
      <affiliation>Faculty of Medicine, Hashemite University, Zarqa, Jordan</affiliation>
    </creator>
    <creator>
      <creatorName>Thomas Shafee</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0002-2298-7593</nameIdentifier>
      <affiliation>La Trobe University, Melbourne, Victoria, Australia</affiliation>
    </creator>
    <creator>
      <creatorName>Eric Prud'Hommeaux</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0003-1775-9921</nameIdentifier>
      <affiliation>World Wide Web Consortium, Cambridge, Massachusetts, United States of America</affiliation>
    </creator>
    <creator>
      <creatorName>Tiago Lubiana</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0003-2473-2313</nameIdentifier>
      <affiliation>Computational Systems Biology Laboratory, University of São Paulo, São Paulo, Brazil</affiliation>
    </creator>
    <creator>
      <creatorName>Diptanshu Das</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0002-7221-5022</nameIdentifier>
      <affiliation>Institute of Child Health (ICH), Kolkata, India</affiliation>
    </creator>
    <creator>
      <creatorName>Daniel Mietchen</creatorName>
      <nameIdentifier nameIdentifierScheme="ORCID" schemeURI="http://orcid.org/">0000-0001-9488-1870</nameIdentifier>
      <affiliation>School of Data Science, University of Virginia, Charlottesville, Virginia, United States of America</affiliation>
    </creator>
  </creators>
  <titles>
    <title>Using logical constraints to validate information in collaborative knowledge graphs: a study of COVID-19 on Wikidata</title>
  </titles>
  <publisher>Zenodo</publisher>
  <publicationYear>2020</publicationYear>
  <subjects>
    <subject>SPARQL</subject>
    <subject>Public health surveillance</subject>
    <subject>Wikidata</subject>
    <subject>Knowledge graph refinement</subject>
    <subject>COVID-19</subject>
    <subject>Validation constraints</subject>
  </subjects>
  <dates>
    <date dateType="Issued">2020-08-30</date>
  </dates>
  <language>en</language>
  <!-- "Preprint" requires schema 4.4 or later; see the schemaLocation on the root element. -->
  <resourceType resourceTypeGeneral="Preprint"/>
  <alternateIdentifiers>
    <alternateIdentifier alternateIdentifierType="url">https://zenodo.org/record/4445363</alternateIdentifier>
  </alternateIdentifiers>
  <!-- Links this record to another Zenodo DOI (IsVersionOf) and to the Zenodo communities it is part of. -->
  <relatedIdentifiers>
    <relatedIdentifier relatedIdentifierType="DOI" relationType="IsVersionOf">10.5281/zenodo.4008358</relatedIdentifier>
    <relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://zenodo.org/communities/africarxiv</relatedIdentifier>
    <relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://zenodo.org/communities/bioinformatics</relatedIdentifier>
    <relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://zenodo.org/communities/covid-19</relatedIdentifier>
  </relatedIdentifiers>
  <rightsList>
    <rights rightsURI="https://creativecommons.org/licenses/by/4.0/legalcode">Creative Commons Attribution 4.0 International</rights>
    <rights rightsURI="info:eu-repo/semantics/openAccess">Open Access</rights>
  </rightsList>
  <!--
    The abstract carries entity-escaped HTML paragraph tags as plain text.
    Whitespace and line breaks inside the description element are data,
    so its content is deliberately left unindented.
  -->
  <descriptions>
    <description descriptionType="Abstract">&lt;p&gt;Urgent global research demands real-time dissemination of precise data. Wikidata, a collaborative and openly licensed knowledge graph available in RDF format, provides a forum for exchanging structured data. In this research paper, we catalog the rules describing relational and statistical COVID-19 epidemiological data and implement them in SPARQL, a query language for semantic databases. We demonstrate the efficiency of our methods to evaluate structured information, particularly COVID-19 knowledge in Wikidata, and consequently in collaborative ontologies and knowledge graphs, and we show the advantages and drawbacks of our proposed approach by comparing it to other methods for validation of linked web data.&lt;/p&gt;

&lt;p&gt;This paper is a preprint and has not yet received peer-review.&lt;/p&gt;</description>
  </descriptions>
</resource>
2,224 views
673 downloads
| | All versions | This version |
| Views | 2,224 | 634 |
| Downloads | 673 | 130 |
| Data volume | 925.5 MB | 197.9 MB |
| Unique views | 2,005 | 626 |
| Unique downloads | 628 | 129 |

Share

Cite as